ppo-PyramidsTraining / run_logs /timers.json

First Push

405e4db verified over 1 year ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.6160495281219482,
	"min": 0.6093841195106506,
	"max": 1.3897463083267212,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 18599.767578125,
	"min": 18408.275390625,
	"max": 42159.34375,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989914.0,
	"min": 29996.0,
	"max": 989914.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989914.0,
	"min": 29996.0,
	"max": 989914.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.43479880690574646,
	"min": -0.12259074300527573,
	"max": 0.535243570804596,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 116.96087646484375,
	"min": -29.176597595214844,
	"max": 146.65673828125,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.06376861035823822,
	"min": -0.01667921617627144,
	"max": 0.36044588685035706,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 17.153757095336914,
	"min": -4.403313159942627,
	"max": 86.86746215820312,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06726242829366433,
	"min": 0.06489429489726992,
	"max": 0.07389396612208136,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9416739961113005,
	"min": 0.5274496376786197,
	"max": 1.0647492395316174,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.012002619287938745,
	"min": 0.0003404957719820241,
	"max": 0.015414567366471081,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.16803667003114242,
	"min": 0.004065029767002356,
	"max": 0.21607641108372871,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.4099475300499955e-06,
	"min": 7.4099475300499955e-06,
	"max": 0.00029484945171685004,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00010373926542069994,
	"min": 0.00010373926542069994,
	"max": 0.0033826604724466,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10246995000000002,
	"min": 0.10246995000000002,
	"max": 0.19828315000000002,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4345793000000002,
	"min": 1.4345793000000002,
	"max": 2.5275534000000004,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.0002567480049999999,
	"min": 0.0002567480049999999,
	"max": 0.009828486684999999,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0035944720699999985,
	"min": 0.0035944720699999985,
	"max": 0.11278258466000002,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.00805074255913496,
	"min": 0.00805074255913496,
	"max": 0.541143536567688,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.11271040141582489,
	"min": 0.11271040141582489,
	"max": 4.329148292541504,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 424.6764705882353,
	"min": 360.8433734939759,
	"max": 999.0,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 28878.0,
	"min": 16283.0,
	"max": 32752.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.3693940985728712,
	"min": -0.9999375520274043,
	"max": 1.5668481766100388,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 93.11879870295525,
	"min": -31.998001664876938,
	"max": 130.04839865863323,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.3693940985728712,
	"min": -0.9999375520274043,
	"max": 1.5668481766100388,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 93.11879870295525,
	"min": -31.998001664876938,
	"max": 130.04839865863323,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.03584493006158428,
	"min": 0.0338602943366242,
	"max": 11.280355455244289,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 2.4374552441877313,
	"min": 2.4374552441877313,
	"max": 191.7660427391529,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1727024589",
	"python_version": "3.10.12 (main, Sep 11 2024, 15:47:36) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.4.1+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1727026822"
	},
	"total": 2233.4375273699998,
	"count": 1,
	"self": 0.48962489599989567,
	"children": {
	"run_training.setup": {
	"total": 0.05216245900010108,
	"count": 1,
	"self": 0.05216245900010108
	},
	"TrainerController.start_learning": {
	"total": 2232.895740015,
	"count": 1,
	"self": 1.3713316260009378,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.1563812039998993,
	"count": 1,
	"self": 2.1563812039998993
	},
	"TrainerController.advance": {
	"total": 2229.303511764999,
	"count": 63627,
	"self": 1.3527722009916943,
	"children": {
	"env_step": {
	"total": 1429.588737249014,
	"count": 63627,
	"self": 1324.996720927954,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 103.76874994705668,
	"count": 63627,
	"self": 4.608621051025693,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 99.16012889603098,
	"count": 62561,
	"self": 99.16012889603098
	}
	}
	},
	"workers": {
	"total": 0.8232663740034241,
	"count": 63627,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2227.981373906985,
	"count": 63627,
	"is_parallel": true,
	"self": 1021.0219533739696,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.002621614999952726,
	"count": 1,
	"is_parallel": true,
	"self": 0.0007389169998077705,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0018826980001449556,
	"count": 8,
	"is_parallel": true,
	"self": 0.0018826980001449556
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.1002839259999746,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006602199998724245,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00044013599995196273,
	"count": 1,
	"is_parallel": true,
	"self": 0.00044013599995196273
	},
	"communicator.exchange": {
	"total": 0.0923262840001371,
	"count": 1,
	"is_parallel": true,
	"self": 0.0923262840001371
	},
	"steps_from_proto": {
	"total": 0.006857286000013119,
	"count": 1,
	"is_parallel": true,
	"self": 0.00036737199980052537,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.006489914000212593,
	"count": 8,
	"is_parallel": true,
	"self": 0.006489914000212593
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1206.9594205330154,
	"count": 63626,
	"is_parallel": true,
	"self": 33.06978756404874,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 22.50551274498116,
	"count": 63626,
	"is_parallel": true,
	"self": 22.50551274498116
	},
	"communicator.exchange": {
	"total": 1057.0431491099962,
	"count": 63626,
	"is_parallel": true,
	"self": 1057.0431491099962
	},
	"steps_from_proto": {
	"total": 94.34097111398933,
	"count": 63626,
	"is_parallel": true,
	"self": 18.976875728015784,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 75.36409538597354,
	"count": 509008,
	"is_parallel": true,
	"self": 75.36409538597354
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 798.3620023149931,
	"count": 63627,
	"self": 2.6710232680313766,
	"children": {
	"process_trajectory": {
	"total": 125.1857095709654,
	"count": 63627,
	"self": 125.00212068996575,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.18358888099965043,
	"count": 2,
	"self": 0.18358888099965043
	}
	}
	},
	"_update_policy": {
	"total": 670.5052694759963,
	"count": 450,
	"self": 285.2489153439758,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 385.25635413202053,
	"count": 22785,
	"self": 385.25635413202053
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 9.54999904934084e-07,
	"count": 1,
	"self": 9.54999904934084e-07
	},
	"TrainerController._save_models": {
	"total": 0.06451446500022939,
	"count": 1,
	"self": 0.001570430000356282,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.06294403499987311,
	"count": 1,
	"self": 0.06294403499987311
	}
	}
	}
	}
	}
	}
	}