First Push

25b1a56 verified 3 months ago

17.5 kB

	{
	"name": "root",
	"gauges": {
	"SnowballTarget.Policy.Entropy.mean": {
	"value": 0.5065417289733887,
	"min": 0.49549272656440735,
	"max": 2.813369035720825,
	"count": 30
	},
	"SnowballTarget.Policy.Entropy.sum": {
	"value": 4858.74853515625,
	"min": 4858.74853515625,
	"max": 28718.87109375,
	"count": 30
	},
	"SnowballTarget.Step.mean": {
	"value": 499952.0,
	"min": 209936.0,
	"max": 499952.0,
	"count": 30
	},
	"SnowballTarget.Step.sum": {
	"value": 499952.0,
	"min": 209936.0,
	"max": 499952.0,
	"count": 30
	},
	"SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
	"value": 13.20620059967041,
	"min": 2.071056842803955,
	"max": 13.317708015441895,
	"count": 30
	},
	"SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
	"value": 2694.06494140625,
	"min": 393.50079345703125,
	"max": 2705.673828125,
	"count": 30
	},
	"SnowballTarget.Losses.PolicyLoss.mean": {
	"value": 0.06573672673260386,
	"min": 0.06349465119602232,
	"max": 0.07748843980131342,
	"count": 30
	},
	"SnowballTarget.Losses.PolicyLoss.sum": {
	"value": 0.32868363366301934,
	"min": 0.2594767195506553,
	"max": 0.37172240696336123,
	"count": 30
	},
	"SnowballTarget.Losses.ValueLoss.mean": {
	"value": 0.17950843812203873,
	"min": 0.1739506449039076,
	"max": 0.2768958347539107,
	"count": 30
	},
	"SnowballTarget.Losses.ValueLoss.sum": {
	"value": 0.8975421906101937,
	"min": 0.6958025796156304,
	"max": 1.3364396822803162,
	"count": 30
	},
	"SnowballTarget.Policy.LearningRate.mean": {
	"value": 3.0288989903999985e-06,
	"min": 3.0288989903999985e-06,
	"max": 0.0001766088411304,
	"count": 30
	},
	"SnowballTarget.Policy.LearningRate.sum": {
	"value": 1.5144494951999991e-05,
	"min": 1.5144494951999991e-05,
	"max": 0.000853344215552,
	"count": 30
	},
	"SnowballTarget.Policy.Epsilon.mean": {
	"value": 0.1010096,
	"min": 0.1010096,
	"max": 0.1588696,
	"count": 30
	},
	"SnowballTarget.Policy.Epsilon.sum": {
	"value": 0.505048,
	"min": 0.4119584,
	"max": 0.784448,
	"count": 30
	},
	"SnowballTarget.Policy.Beta.mean": {
	"value": 1.0908639999999999e-05,
	"min": 1.0908639999999999e-05,
	"max": 6.298264e-05,
	"count": 30
	},
	"SnowballTarget.Policy.Beta.sum": {
	"value": 5.4543199999999996e-05,
	"min": 5.0762560000000005e-05,
	"max": 0.00030600320000000007,
	"count": 30
	},
	"SnowballTarget.Environment.EpisodeLength.mean": {
	"value": 199.0,
	"min": 199.0,
	"max": 199.0,
	"count": 30
	},
	"SnowballTarget.Environment.EpisodeLength.sum": {
	"value": 10945.0,
	"min": 8756.0,
	"max": 10945.0,
	"count": 30
	},
	"SnowballTarget.Environment.CumulativeReward.mean": {
	"value": 25.472727272727273,
	"min": 5.090909090909091,
	"max": 26.21818181818182,
	"count": 30
	},
	"SnowballTarget.Environment.CumulativeReward.sum": {
	"value": 1401.0,
	"min": 224.0,
	"max": 1442.0,
	"count": 30
	},
	"SnowballTarget.Policy.ExtrinsicReward.mean": {
	"value": 25.472727272727273,
	"min": 5.090909090909091,
	"max": 26.21818181818182,
	"count": 30
	},
	"SnowballTarget.Policy.ExtrinsicReward.sum": {
	"value": 1401.0,
	"min": 224.0,
	"max": 1442.0,
	"count": 30
	},
	"SnowballTarget.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 30
	},
	"SnowballTarget.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 30
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1773664937",
	"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --resume --no-graphics",
	"mlagents_version": "1.1.0",
	"mlagents_envs_version": "1.1.0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.10.0+cu128",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1773665602"
	},
	"total": 665.0540399700003,
	"count": 1,
	"self": 0.6973311459996694,
	"children": {
	"run_training.setup": {
	"total": 0.039469952000217745,
	"count": 1,
	"self": 0.039469952000217745
	},
	"TrainerController.start_learning": {
	"total": 664.3172388720004,
	"count": 1,
	"self": 0.4871282610538401,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.3383428580000327,
	"count": 1,
	"self": 2.3383428580000327
	},
	"TrainerController.advance": {
	"total": 658.9868647379471,
	"count": 27264,
	"self": 0.5162136149492653,
	"children": {
	"env_step": {
	"total": 462.7353537499994,
	"count": 27264,
	"self": 354.8981654089739,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 107.53536951897786,
	"count": 27264,
	"self": 1.8760541230203671,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 105.65931539595749,
	"count": 27264,
	"self": 105.65931539595749
	}
	}
	},
	"workers": {
	"total": 0.3018188220476077,
	"count": 27264,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 658.0246860219531,
	"count": 27264,
	"is_parallel": true,
	"self": 344.6093568760225,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0029834299994035973,
	"count": 1,
	"is_parallel": true,
	"self": 0.0008881549983925652,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.002095275001011032,
	"count": 10,
	"is_parallel": true,
	"self": 0.002095275001011032
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.03488423700036947,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005924939996475587,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00036805099989578594,
	"count": 1,
	"is_parallel": true,
	"self": 0.00036805099989578594
	},
	"communicator.exchange": {
	"total": 0.03205556900047668,
	"count": 1,
	"is_parallel": true,
	"self": 0.03205556900047668
	},
	"steps_from_proto": {
	"total": 0.001868123000349442,
	"count": 1,
	"is_parallel": true,
	"self": 0.0003917840012945817,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0014763389990548603,
	"count": 10,
	"is_parallel": true,
	"self": 0.0014763389990548603
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 313.4153291459306,
	"count": 27263,
	"is_parallel": true,
	"self": 14.76222867101933,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 8.029466016941115,
	"count": 27263,
	"is_parallel": true,
	"self": 8.029466016941115
	},
	"communicator.exchange": {
	"total": 236.13212464500702,
	"count": 27263,
	"is_parallel": true,
	"self": 236.13212464500702
	},
	"steps_from_proto": {
	"total": 54.49150981296316,
	"count": 27263,
	"is_parallel": true,
	"self": 9.97395067870093,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 44.51755913426223,
	"count": 272630,
	"is_parallel": true,
	"self": 44.51755913426223
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 195.7352973729985,
	"count": 27264,
	"self": 0.6209096390075501,
	"children": {
	"process_trajectory": {
	"total": 52.91728896898803,
	"count": 27264,
	"self": 39.97520039498704,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 12.94208857400099,
	"count": 6,
	"self": 12.94208857400099
	}
	}
	},
	"_update_policy": {
	"total": 142.19709876500292,
	"count": 136,
	"self": 55.1479849309535,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 87.04911383404942,
	"count": 6933,
	"self": 87.04911383404942
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.0049998309114017e-06,
	"count": 1,
	"self": 1.0049998309114017e-06
	},
	"TrainerController._save_models": {
	"total": 2.5049020099995687,
	"count": 1,
	"self": 0.0008557359997212188,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 2.5040462739998475,
	"count": 1,
	"self": 2.5040462739998475
	}
	}
	}
	}
	}
	}
	}