First Push

b091756 verified over 1 year ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.41119223833084106,
	"min": 0.41119223833084106,
	"max": 1.471925973892212,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 12151.552734375,
	"min": 12151.552734375,
	"max": 44652.34765625,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989883.0,
	"min": 29952.0,
	"max": 989883.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989883.0,
	"min": 29952.0,
	"max": 989883.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.427590012550354,
	"min": -0.31348738074302673,
	"max": 0.5430094003677368,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 113.31135559082031,
	"min": -74.2965087890625,
	"max": 150.41360473632812,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.030404971912503242,
	"min": -0.011679602786898613,
	"max": 0.35483700037002563,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 8.057317733764648,
	"min": -3.1184539794921875,
	"max": 85.16088104248047,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06963869239373527,
	"min": 0.06418292059690567,
	"max": 0.07342489732537676,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9749416935122938,
	"min": 0.5139742812776373,
	"max": 1.0415133859085686,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.014876755937567558,
	"min": 0.00016056364700314042,
	"max": 0.016039063518941736,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.20827458312594582,
	"min": 0.0020873274110408254,
	"max": 0.2245468892651843,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.750233130907146e-06,
	"min": 7.750233130907146e-06,
	"max": 0.00029515063018788575,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00010850326383270003,
	"min": 0.00010850326383270003,
	"max": 0.0036090432969856,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10258337857142859,
	"min": 0.10258337857142859,
	"max": 0.19838354285714285,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4361673000000001,
	"min": 1.3886848,
	"max": 2.569091400000001,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.0002680795192857144,
	"min": 0.0002680795192857144,
	"max": 0.00983851593142857,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.003753113270000002,
	"min": 0.003753113270000002,
	"max": 0.12031113856,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.013370824977755547,
	"min": 0.013067224994301796,
	"max": 0.44320252537727356,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.18719154596328735,
	"min": 0.18294115364551544,
	"max": 3.1024177074432373,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 431.6857142857143,
	"min": 359.5365853658537,
	"max": 999.0,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 30218.0,
	"min": 15984.0,
	"max": 33444.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.4825685461716993,
	"min": -1.0000000521540642,
	"max": 1.5938626305166497,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 103.77979823201895,
	"min": -31.99320162832737,
	"max": 132.29059833288193,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.4825685461716993,
	"min": -1.0000000521540642,
	"max": 1.5938626305166497,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 103.77979823201895,
	"min": -31.99320162832737,
	"max": 132.29059833288193,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.06012799181376717,
	"min": 0.047820723676599605,
	"max": 9.20178209245205,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 4.208959426963702,
	"min": 3.9691200651577674,
	"max": 147.2285134792328,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1716267205",
	"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.2.1+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1716270872"
	},
	"total": 3666.491618387001,
	"count": 1,
	"self": 0.6056720080014202,
	"children": {
	"run_training.setup": {
	"total": 0.08369009099988034,
	"count": 1,
	"self": 0.08369009099988034
	},
	"TrainerController.start_learning": {
	"total": 3665.8022562879996,
	"count": 1,
	"self": 2.5587414731307945,
	"children": {
	"TrainerController._reset_env": {
	"total": 4.3099131639992265,
	"count": 1,
	"self": 4.3099131639992265
	},
	"TrainerController.advance": {
	"total": 3658.8384550078717,
	"count": 63591,
	"self": 2.6622956246756075,
	"children": {
	"env_step": {
	"total": 2455.0247556050854,
	"count": 63591,
	"self": 2269.795731178263,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 183.6438605799558,
	"count": 63591,
	"self": 8.054882045929844,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 175.58897853402596,
	"count": 62569,
	"self": 175.58897853402596
	}
	}
	},
	"workers": {
	"total": 1.5851638468666351,
	"count": 63591,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 3658.4097298003308,
	"count": 63591,
	"is_parallel": true,
	"self": 1598.6894520580572,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0034536969997134292,
	"count": 1,
	"is_parallel": true,
	"self": 0.0011708140027621994,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.00228288299695123,
	"count": 8,
	"is_parallel": true,
	"self": 0.00228288299695123
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.07880420999936177,
	"count": 1,
	"is_parallel": true,
	"self": 0.0009447929987800308,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0003980229994340334,
	"count": 1,
	"is_parallel": true,
	"self": 0.0003980229994340334
	},
	"communicator.exchange": {
	"total": 0.07514179099962348,
	"count": 1,
	"is_parallel": true,
	"self": 0.07514179099962348
	},
	"steps_from_proto": {
	"total": 0.0023196030015242286,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004996620009478647,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0018199410005763639,
	"count": 8,
	"is_parallel": true,
	"self": 0.0018199410005763639
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 2059.7202777422735,
	"count": 63590,
	"is_parallel": true,
	"self": 54.83721629233514,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 30.524886827221053,
	"count": 63590,
	"is_parallel": true,
	"self": 30.524886827221053
	},
	"communicator.exchange": {
	"total": 1835.700426211004,
	"count": 63590,
	"is_parallel": true,
	"self": 1835.700426211004
	},
	"steps_from_proto": {
	"total": 138.65774841171333,
	"count": 63590,
	"is_parallel": true,
	"self": 30.40246924056919,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 108.25527917114414,
	"count": 508720,
	"is_parallel": true,
	"self": 108.25527917114414
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 1201.1514037781108,
	"count": 63591,
	"self": 5.0563354261230415,
	"children": {
	"process_trajectory": {
	"total": 186.4566107019691,
	"count": 63591,
	"self": 186.15627448797022,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.30033621399888943,
	"count": 2,
	"self": 0.30033621399888943
	}
	}
	},
	"_update_policy": {
	"total": 1009.6384576500186,
	"count": 453,
	"self": 395.337199764821,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 614.3012578851976,
	"count": 22749,
	"self": 614.3012578851976
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.2519994925241917e-06,
	"count": 1,
	"self": 1.2519994925241917e-06
	},
	"TrainerController._save_models": {
	"total": 0.09514539099836838,
	"count": 1,
	"self": 0.001965040997674805,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.09318035000069358,
	"count": 1,
	"self": 0.09318035000069358
	}
	}
	}
	}
	}
	}
	}