First Push

8dfb21e almost 3 years ago

20.6 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 2.8534560203552246,
	"min": 0.6876733303070068,
	"max": 3.2957088947296143,
	"count": 977
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 49399.03125,
	"min": 9473.9580078125,
	"max": 119219.5546875,
	"count": 977
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 999.0,
	"min": 383.9230769230769,
	"max": 999.0,
	"count": 977
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19980.0,
	"min": 15568.0,
	"max": 24904.0,
	"count": 977
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1165.607650045886,
	"min": 1163.1255753867908,
	"max": 1200.4353352507048,
	"count": 151
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 2331.215300091772,
	"min": 2326.2511507735817,
	"max": 21251.307919762614,
	"count": 151
	},
	"SoccerTwos.Step.mean": {
	"value": 9769694.0,
	"min": 9070.0,
	"max": 9769694.0,
	"count": 977
	},
	"SoccerTwos.Step.sum": {
	"value": 9769694.0,
	"min": 9070.0,
	"max": 9769694.0,
	"count": 977
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": 0.0018585395300760865,
	"min": -0.02852208912372589,
	"max": 0.03621601313352585,
	"count": 977
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": 0.01858539506793022,
	"min": -0.38130223751068115,
	"max": 0.5431860685348511,
	"count": 977
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.0019360113656148314,
	"min": -0.03305850178003311,
	"max": 0.03623698651790619,
	"count": 977
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": 0.019360113888978958,
	"min": -0.36394256353378296,
	"max": 0.5434552431106567,
	"count": 977
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 977
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 977
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.0,
	"min": -0.5333333333333333,
	"max": 0.32597143203020096,
	"count": 977
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 0.0,
	"min": -8.831599980592728,
	"max": 4.563600048422813,
	"count": 977
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.0,
	"min": -0.5333333333333333,
	"max": 0.32597143203020096,
	"count": 977
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 0.0,
	"min": -8.831599980592728,
	"max": 4.563600048422813,
	"count": 977
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 977
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 977
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.01617720452947348,
	"min": 0.009041061301347023,
	"max": 0.023895814525894822,
	"count": 447
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.01617720452947348,
	"min": 0.009041061301347023,
	"max": 0.023895814525894822,
	"count": 447
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 4.3075555424820775e-07,
	"min": 3.796161938037409e-11,
	"max": 0.007123635763612886,
	"count": 447
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 4.3075555424820775e-07,
	"min": 3.796161938037409e-11,
	"max": 0.007123635763612886,
	"count": 447
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 3.827969493386263e-07,
	"min": 5.499825155482381e-11,
	"max": 0.006830077370007833,
	"count": 447
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 3.827969493386263e-07,
	"min": 5.499825155482381e-11,
	"max": 0.006830077370007833,
	"count": 447
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 447
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 447
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 447
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.20000000000000007,
	"max": 0.20000000000000007,
	"count": 447
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 447
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005000000000000001,
	"max": 0.005000000000000001,
	"count": 447
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1682399581",
	"python_version": "3.8.12 \| packaged by conda-forge \| (default, Sep 29 2021, 19:50:30) \n[GCC 9.4.0]",
	"command_line_arguments": "/home/jason/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos.exe --run-id=SoccerTwos --no-graphics --resume",
	"mlagents_version": "0.29.0.dev0",
	"mlagents_envs_version": "0.29.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.8.0",
	"numpy_version": "1.23.0",
	"end_time_seconds": "1682440720"
	},
	"total": 41139.5746951662,
	"count": 1,
	"self": 0.0036629438400268555,
	"children": {
	"run_training.setup": {
	"total": 0.018018901348114014,
	"count": 1,
	"self": 0.018018901348114014
	},
	"TrainerController.start_learning": {
	"total": 41139.55301332101,
	"count": 1,
	"self": 10.091750759631395,
	"children": {
	"TrainerController._reset_env": {
	"total": 6.643025405704975,
	"count": 49,
	"self": 6.643025405704975
	},
	"TrainerController.advance": {
	"total": 41122.42403576523,
	"count": 635792,
	"self": 10.281007185578346,
	"children": {
	"env_step": {
	"total": 38821.82201176509,
	"count": 635792,
	"self": 36708.06962808967,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 2107.2789623625576,
	"count": 635792,
	"self": 54.651243790984154,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 2052.6277185715735,
	"count": 1263618,
	"self": 444.1418619453907,
	"children": {
	"TorchPolicy.sample_actions": {
	"total": 1608.4858566261828,
	"count": 1263618,
	"self": 1608.4858566261828
	}
	}
	}
	}
	},
	"workers": {
	"total": 6.473421312868595,
	"count": 635792,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 41122.94743762538,
	"count": 635792,
	"is_parallel": true,
	"self": 5543.7823835499585,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0022903084754943848,
	"count": 2,
	"is_parallel": true,
	"self": 0.00048452243208885193,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0018057860434055328,
	"count": 8,
	"is_parallel": true,
	"self": 0.0018057860434055328
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.06328035518527031,
	"count": 1,
	"is_parallel": true,
	"self": 0.00015142560005187988,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0015549026429653168,
	"count": 1,
	"is_parallel": true,
	"self": 0.0015549026429653168
	},
	"communicator.exchange": {
	"total": 0.059748053550720215,
	"count": 1,
	"is_parallel": true,
	"self": 0.059748053550720215
	},
	"steps_from_proto": {
	"total": 0.001825973391532898,
	"count": 2,
	"is_parallel": true,
	"self": 0.0003262721002101898,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0014997012913227081,
	"count": 8,
	"is_parallel": true,
	"self": 0.0014997012913227081
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 35579.07395424321,
	"count": 635791,
	"is_parallel": true,
	"self": 98.12249110639095,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 805.0765328742564,
	"count": 635791,
	"is_parallel": true,
	"self": 805.0765328742564
	},
	"communicator.exchange": {
	"total": 33494.981812007725,
	"count": 635791,
	"is_parallel": true,
	"self": 33494.981812007725
	},
	"steps_from_proto": {
	"total": 1180.8931182548404,
	"count": 1271582,
	"is_parallel": true,
	"self": 197.63392517343163,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 983.2591930814087,
	"count": 5086328,
	"is_parallel": true,
	"self": 983.2591930814087
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.09109983220696449,
	"count": 96,
	"is_parallel": true,
	"self": 0.015366911888122559,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.07573292031884193,
	"count": 384,
	"is_parallel": true,
	"self": 0.07573292031884193
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 2290.3210168145597,
	"count": 635792,
	"self": 69.18487022817135,
	"children": {
	"process_trajectory": {
	"total": 697.5770987719297,
	"count": 635792,
	"self": 690.940976947546,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 6.636121824383736,
	"count": 19,
	"self": 6.636121824383736
	}
	}
	},
	"_update_policy": {
	"total": 1523.5590478144586,
	"count": 448,
	"self": 751.0578964203596,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 772.501151394099,
	"count": 13420,
	"self": 772.501151394099
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 9.350478649139404e-07,
	"count": 1,
	"self": 9.350478649139404e-07
	},
	"TrainerController._save_models": {
	"total": 0.3942004553973675,
	"count": 1,
	"self": 0.0013845190405845642,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.3928159363567829,
	"count": 1,
	"self": 0.3928159363567829
	}
	}
	}
	}
	}
	}
	}