{
  "name": "root",
  "gauges": {
    "Pyramids.Policy.Entropy.mean": {
      "value": 0.4622722864151001,
      "min": 0.4622722864151001,
      "max": 1.4122027158737183,
      "count": 33
    },
    "Pyramids.Policy.Entropy.sum": {
      "value": 13927.33984375,
      "min": 13927.33984375,
      "max": 42840.58203125,
      "count": 33
    },
    "Pyramids.Step.mean": {
      "value": 989879.0,
      "min": 29952.0,
      "max": 989879.0,
      "count": 33
    },
    "Pyramids.Step.sum": {
      "value": 989879.0,
      "min": 29952.0,
      "max": 989879.0,
      "count": 33
    },
    "Pyramids.Policy.ExtrinsicValueEstimate.mean": {
      "value": 0.35350170731544495,
      "min": -0.10640081763267517,
      "max": 0.39934098720550537,
      "count": 33
    },
    "Pyramids.Policy.ExtrinsicValueEstimate.sum": {
      "value": 94.38495635986328,
      "min": -25.536195755004883,
      "max": 107.42272186279297,
      "count": 33
    },
    "Pyramids.Policy.RndValueEstimate.mean": {
      "value": -0.17795561254024506,
      "min": -0.17795561254024506,
      "max": 0.4715794324874878,
      "count": 33
    },
    "Pyramids.Policy.RndValueEstimate.sum": {
      "value": -47.5141487121582,
      "min": -47.5141487121582,
      "max": 113.17906188964844,
      "count": 33
    },
    "Pyramids.Losses.PolicyLoss.mean": {
      "value": 0.06763381216421015,
      "min": 0.06658038241481076,
      "max": 0.07475794741404432,
      "count": 33
    },
    "Pyramids.Losses.PolicyLoss.sum": {
      "value": 0.9468733702989421,
      "min": 0.4930598800095338,
      "max": 1.074437445572888,
      "count": 33
    },
    "Pyramids.Losses.ValueLoss.mean": {
      "value": 0.019851038272453294,
      "min": 0.0001938182260281338,
      "max": 0.019851038272453294,
      "count": 33
    },
    "Pyramids.Losses.ValueLoss.sum": {
      "value": 0.2779145358143461,
      "min": 0.0021320004863094716,
      "max": 0.2779145358143461,
      "count": 33
    },
    "Pyramids.Policy.LearningRate.mean": {
      "value": 7.4923617882928594e-06,
      "min": 7.4923617882928594e-06,
      "max": 0.00029515063018788575,
      "count": 33
    },
    "Pyramids.Policy.LearningRate.sum": {
      "value": 0.00010489306503610003,
      "min": 0.00010489306503610003,
      "max": 0.0032555667148112004,
      "count": 33
    },
    "Pyramids.Policy.Epsilon.mean": {
      "value": 0.10249742142857143,
      "min": 0.10249742142857143,
      "max": 0.19838354285714285,
      "count": 33
    },
    "Pyramids.Policy.Epsilon.sum": {
      "value": 1.4349639,
      "min": 1.3691136000000002,
      "max": 2.4851888000000004,
      "count": 33
    },
    "Pyramids.Policy.Beta.mean": {
      "value": 0.00025949240071428576,
      "min": 0.00025949240071428576,
      "max": 0.00983851593142857,
      "count": 33
    },
    "Pyramids.Policy.Beta.sum": {
      "value": 0.0036328936100000005,
      "min": 0.0036328936100000005,
      "max": 0.10855036112,
      "count": 33
    },
    "Pyramids.Losses.RNDLoss.mean": {
      "value": 0.016493918374180794,
      "min": 0.016493918374180794,
      "max": 0.5968176126480103,
      "count": 33
    },
    "Pyramids.Losses.RNDLoss.sum": {
      "value": 0.2309148609638214,
      "min": 0.2309148609638214,
      "max": 4.177723407745361,
      "count": 33
    },
    "Pyramids.Environment.EpisodeLength.mean": {
      "value": 454.7692307692308,
      "min": 435.6029411764706,
      "max": 999.0,
      "count": 33
    },
    "Pyramids.Environment.EpisodeLength.sum": {
      "value": 29560.0,
      "min": 15984.0,
      "max": 33389.0,
      "count": 33
    },
    "Pyramids.Environment.CumulativeReward.mean": {
      "value": 1.3913599745585368,
      "min": -1.0000000521540642,
      "max": 1.3913599745585368,
      "count": 33
    },
    "Pyramids.Environment.CumulativeReward.sum": {
      "value": 90.4383983463049,
      "min": -32.000001668930054,
      "max": 90.4383983463049,
      "count": 33
    },
    "Pyramids.Policy.ExtrinsicReward.mean": {
      "value": 1.3913599745585368,
      "min": -1.0000000521540642,
      "max": 1.3913599745585368,
      "count": 33
    },
    "Pyramids.Policy.ExtrinsicReward.sum": {
      "value": 90.4383983463049,
      "min": -32.000001668930054,
      "max": 90.4383983463049,
      "count": 33
    },
    "Pyramids.Policy.RndReward.mean": {
      "value": 0.07740243841365624,
      "min": 0.07740243841365624,
      "max": 11.64180552214384,
      "count": 33
    },
    "Pyramids.Policy.RndReward.sum": {
      "value": 5.031158496887656,
      "min": 5.031158496887656,
      "max": 186.26888835430145,
      "count": 33
    },
    "Pyramids.IsTraining.mean": {
      "value": 1.0,
      "min": 1.0,
      "max": 1.0,
      "count": 33
    },
    "Pyramids.IsTraining.sum": {
      "value": 1.0,
      "min": 1.0,
      "max": 1.0,
      "count": 33
    }
  },
  "metadata": {
    "timer_format_version": "0.1.0",
    "start_time_seconds": "1749455508",
    "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
    "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
    "mlagents_version": "1.2.0.dev0",
    "mlagents_envs_version": "1.2.0.dev0",
    "communication_protocol_version": "1.5.0",
    "pytorch_version": "2.7.1+cu126",
    "numpy_version": "1.23.5",
    "end_time_seconds": "1749457767"
  },
  "total": 2258.4939164939997,
  "count": 1,
  "self": 0.5258019509997212,
  "children": {
    "run_training.setup": {
      "total": 0.019741220000014437,
      "count": 1,
      "self": 0.019741220000014437
    },
    "TrainerController.start_learning": {
      "total": 2257.948373323,
      "count": 1,
      "self": 1.3365377329751027,
      "children": {
        "TrainerController._reset_env": {
          "total": 2.1942436159999943,
          "count": 1,
          "self": 2.1942436159999943
        },
        "TrainerController.advance": {
          "total": 2254.334103334025,
          "count": 63489,
          "self": 1.37891215493255,
          "children": {
            "env_step": {
              "total": 1587.1077853630695,
              "count": 63489,
              "self": 1434.6823327779944,
              "children": {
                "SubprocessEnvManager._take_step": {
                  "total": 151.65833729303904,
                  "count": 63489,
                  "self": 4.605442787028551,
                  "children": {
                    "TorchPolicy.evaluate": {
                      "total": 147.0528945060105,
                      "count": 62555,
                      "self": 147.0528945060105
                    }
                  }
                },
                "workers": {
                  "total": 0.7671152920361237,
                  "count": 63489,
                  "self": 0.0,
                  "children": {
                    "worker_root": {
                      "total": 2252.8565510119906,
                      "count": 63489,
                      "is_parallel": true,
                      "self": 930.3695335799537,
                      "children": {
                        "run_training.setup": {
                          "total": 0.0,
                          "count": 0,
                          "is_parallel": true,
                          "self": 0.0,
                          "children": {
                            "steps_from_proto": {
                              "total": 0.0018889430000399443,
                              "count": 1,
                              "is_parallel": true,
                              "self": 0.0006038980002358585,
                              "children": {
                                "_process_rank_one_or_two_observation": {
                                  "total": 0.0012850449998040858,
                                  "count": 8,
                                  "is_parallel": true,
                                  "self": 0.0012850449998040858
                                }
                              }
                            },
                            "UnityEnvironment.step": {
                              "total": 0.0553759430001719,
                              "count": 1,
                              "is_parallel": true,
                              "self": 0.0005180250002467801,
                              "children": {
                                "UnityEnvironment._generate_step_input": {
                                  "total": 0.0004817110000203684,
                                  "count": 1,
                                  "is_parallel": true,
                                  "self": 0.0004817110000203684
                                },
                                "communicator.exchange": {
                                  "total": 0.05265008099991064,
                                  "count": 1,
                                  "is_parallel": true,
                                  "self": 0.05265008099991064
                                },
                                "steps_from_proto": {
                                  "total": 0.0017261259999941103,
                                  "count": 1,
                                  "is_parallel": true,
                                  "self": 0.00035342800015314424,
                                  "children": {
                                    "_process_rank_one_or_two_observation": {
                                      "total": 0.001372697999840966,
                                      "count": 8,
                                      "is_parallel": true,
                                      "self": 0.001372697999840966
                                    }
                                  }
                                }
                              }
                            }
                          }
                        },
                        "UnityEnvironment.step": {
                          "total": 1322.487017432037,
                          "count": 63488,
                          "is_parallel": true,
                          "self": 31.618346542983545,
                          "children": {
                            "UnityEnvironment._generate_step_input": {
                              "total": 22.866671464011915,
                              "count": 63488,
                              "is_parallel": true,
                              "self": 22.866671464011915
                            },
                            "communicator.exchange": {
                              "total": 1172.5197741640293,
                              "count": 63488,
                              "is_parallel": true,
                              "self": 1172.5197741640293
                            },
                            "steps_from_proto": {
                              "total": 95.48222526101222,
                              "count": 63488,
                              "is_parallel": true,
                              "self": 19.236276070954546,
                              "children": {
                                "_process_rank_one_or_two_observation": {
                                  "total": 76.24594919005767,
                                  "count": 507904,
                                  "is_parallel": true,
                                  "self": 76.24594919005767
                                }
                              }
                            }
                          }
                        }
                      }
                    }
                  }
                }
              }
            },
            "trainer_advance": {
              "total": 665.847405816023,
              "count": 63489,
              "self": 2.525921006986664,
              "children": {
                "process_trajectory": {
                  "total": 127.4534642450351,
                  "count": 63489,
                  "self": 127.2476142080352,
                  "children": {
                    "RLTrainer._checkpoint": {
                      "total": 0.20585003699989102,
                      "count": 2,
                      "self": 0.20585003699989102
                    }
                  }
                },
                "_update_policy": {
                  "total": 535.8680205640012,
                  "count": 444,
                  "self": 297.2262207399767,
                  "children": {
                    "TorchPPOOptimizer.update": {
                      "total": 238.64179982402447,
                      "count": 22818,
                      "self": 238.64179982402447
                    }
                  }
                }
              }
            }
          }
        },
        "trainer_threads": {
          "total": 1.2150003385613672e-06,
          "count": 1,
          "self": 1.2150003385613672e-06
        },
        "TrainerController._save_models": {
          "total": 0.08348742499993023,
          "count": 1,
          "self": 0.0013612739999189216,
          "children": {
            "RLTrainer._checkpoint": {
              "total": 0.0821261510000113,
              "count": 1,
              "self": 0.0821261510000113
            }
          }
        }
      }
    }
  }
}