{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.998950719833374,
"min": 0.9001078605651855,
"max": 1.4380332231521606,
"count": 13
},
"Pyramids.Policy.Entropy.sum": {
"value": 30256.21875,
"min": 26960.03125,
"max": 43624.17578125,
"count": 13
},
"Pyramids.Step.mean": {
"value": 389922.0,
"min": 29952.0,
"max": 389922.0,
"count": 13
},
"Pyramids.Step.sum": {
"value": 389922.0,
"min": 29952.0,
"max": 389922.0,
"count": 13
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.04003271833062172,
"min": -0.270123153924942,
"max": 0.04003271833062172,
"count": 13
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 9.968147277832031,
"min": -64.0191879272461,
"max": 9.968147277832031,
"count": 13
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.03113975003361702,
"min": 0.03113975003361702,
"max": 0.33837276697158813,
"count": 13
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 7.75379753112793,
"min": 7.75379753112793,
"max": 81.20946502685547,
"count": 13
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.07138317823434492,
"min": 0.06532376273643901,
"max": 0.07496527767407479,
"count": 13
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9993644952808289,
"min": 0.5247569437185235,
"max": 0.9993978770180985,
"count": 13
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.005047186439996159,
"min": 0.0006489568515479398,
"max": 0.00795678350329263,
"count": 13
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.07066061015994622,
"min": 0.009085395921671157,
"max": 0.07066061015994622,
"count": 13
},
"Pyramids.Policy.LearningRate.mean": {
"value": 0.00018756205176504283,
"min": 0.00018756205176504283,
"max": 0.00029515063018788575,
"count": 13
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.0026258687247105996,
"min": 0.0020660544113152,
"max": 0.0035081708306098002,
"count": 13
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.16252067142857143,
"min": 0.16252067142857143,
"max": 0.19838354285714285,
"count": 13
},
"Pyramids.Policy.Epsilon.sum": {
"value": 2.2752894,
"min": 1.3886848,
"max": 2.5693902,
"count": 13
},
"Pyramids.Policy.Beta.mean": {
"value": 0.006255815075714286,
"min": 0.006255815075714286,
"max": 0.00983851593142857,
"count": 13
},
"Pyramids.Policy.Beta.sum": {
"value": 0.08758141106,
"min": 0.06886961152,
"max": 0.11696208098000001,
"count": 13
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.026629071682691574,
"min": 0.026629071682691574,
"max": 0.5501084923744202,
"count": 13
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.37280699610710144,
"min": 0.37280699610710144,
"max": 3.850759267807007,
"count": 13
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 817.1891891891892,
"min": 817.1891891891892,
"max": 999.0,
"count": 13
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 30236.0,
"min": 15984.0,
"max": 32383.0,
"count": 13
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 0.1554540216520026,
"min": -1.0000000521540642,
"max": 0.1554540216520026,
"count": 13
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 5.751798801124096,
"min": -30.374401703476906,
"max": 5.751798801124096,
"count": 13
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 0.1554540216520026,
"min": -1.0000000521540642,
"max": 0.1554540216520026,
"count": 13
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 5.751798801124096,
"min": -30.374401703476906,
"max": 5.751798801124096,
"count": 13
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.2267604800841041,
"min": 0.2267604800841041,
"max": 11.075799133628607,
"count": 13
},
"Pyramids.Policy.RndReward.sum": {
"value": 8.390137763111852,
"min": 8.390137763111852,
"max": 177.2127861380577,
"count": 13
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 13
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 13
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1739707764",
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "1.2.0.dev0",
"mlagents_envs_version": "1.2.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.6.0+cu124",
"numpy_version": "1.23.5",
"end_time_seconds": "1739708387"
},
"total": 623.555400056,
"count": 1,
"self": 0.207407645000103,
"children": {
"run_training.setup": {
"total": 0.0207760230000531,
"count": 1,
"self": 0.0207760230000531
},
"TrainerController.start_learning": {
"total": 623.3272163879999,
"count": 1,
"self": 0.5804582989712799,
"children": {
"TrainerController._reset_env": {
"total": 2.128190472999904,
"count": 1,
"self": 2.128190472999904
},
"TrainerController.advance": {
"total": 620.6185676160287,
"count": 24668,
"self": 0.35215339301498716,
"children": {
"env_step": {
"total": 381.4078416239993,
"count": 24668,
"self": 326.8474191459836,
"children": {
"SubprocessEnvManager._take_step": {
"total": 54.282723165007155,
"count": 24668,
"self": 1.6065761640165874,
"children": {
"TorchPolicy.evaluate": {
"total": 52.67614700099057,
"count": 24493,
"self": 52.67614700099057
}
}
},
"workers": {
"total": 0.2776993130084975,
"count": 24668,
"self": 0.0,
"children": {
"worker_root": {
"total": 621.8310794920035,
"count": 24668,
"is_parallel": true,
"self": 328.1429784449724,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0020393869999679737,
"count": 1,
"is_parallel": true,
"self": 0.0007243360000757093,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0013150509998922644,
"count": 8,
"is_parallel": true,
"self": 0.0013150509998922644
}
}
},
"UnityEnvironment.step": {
"total": 0.03658156300002702,
"count": 1,
"is_parallel": true,
"self": 0.00034424299997226626,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.00032593700007055304,
"count": 1,
"is_parallel": true,
"self": 0.00032593700007055304
},
"communicator.exchange": {
"total": 0.03484145399988847,
"count": 1,
"is_parallel": true,
"self": 0.03484145399988847
},
"steps_from_proto": {
"total": 0.0010699290000957262,
"count": 1,
"is_parallel": true,
"self": 0.000244267999960357,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0008256610001353692,
"count": 8,
"is_parallel": true,
"self": 0.0008256610001353692
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 293.68810104703107,
"count": 24667,
"is_parallel": true,
"self": 7.555183527048712,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 5.121828956032232,
"count": 24667,
"is_parallel": true,
"self": 5.121828956032232
},
"communicator.exchange": {
"total": 258.0160779459791,
"count": 24667,
"is_parallel": true,
"self": 258.0160779459791
},
"steps_from_proto": {
"total": 22.995010617971047,
"count": 24667,
"is_parallel": true,
"self": 4.918657078003889,
"children": {
"_process_rank_one_or_two_observation": {
"total": 18.076353539967158,
"count": 197336,
"is_parallel": true,
"self": 18.076353539967158
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 238.7443043300143,
"count": 24668,
"self": 1.4473783860100866,
"children": {
"process_trajectory": {
"total": 42.442379013004484,
"count": 24668,
"self": 42.442379013004484
},
"_update_policy": {
"total": 194.85454693099973,
"count": 163,
"self": 107.04484613799445,
"children": {
"TorchPPOOptimizer.update": {
"total": 87.80970079300528,
"count": 8920,
"self": 87.80970079300528
}
}
}
}
},
"trainer_threads": {
"total": 1.3240000953373965e-06,
"count": 1,
"self": 1.3240000953373965e-06
},
"TrainerController._save_models": {
"total": 0.11426694500005397,
"count": 1,
"self": 0.0014725500000167813,
"children": {
"RLTrainer._checkpoint": {
"total": 0.11279439500003718,
"count": 1,
"self": 0.11279439500003718
}
}
}
}
}
}
}
}
}