{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.4158688485622406,
"min": 0.4158688485622406,
"max": 1.4334027767181396,
"count": 38
},
"Pyramids.Policy.Entropy.sum": {
"value": 12482.7197265625,
"min": 12482.7197265625,
"max": 43483.70703125,
"count": 38
},
"Pyramids.Step.mean": {
"value": 1139954.0,
"min": 29902.0,
"max": 1139954.0,
"count": 38
},
"Pyramids.Step.sum": {
"value": 1139954.0,
"min": 29902.0,
"max": 1139954.0,
"count": 38
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.4747034013271332,
"min": -0.09710239619016647,
"max": 0.5281603932380676,
"count": 38
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 129.11932373046875,
"min": -23.40167808532715,
"max": 143.1314697265625,
"count": 38
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.003889927174896002,
"min": -0.0016563987592235208,
"max": 0.32075613737106323,
"count": 38
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 1.0580601692199707,
"min": -0.4207252860069275,
"max": 76.01920318603516,
"count": 38
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.0710136718435457,
"min": 0.06403720775751708,
"max": 0.0738912057907631,
"count": 38
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9941914058096398,
"min": 0.5896578854585877,
"max": 1.1083680868614465,
"count": 38
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.015340565439102996,
"min": 0.00017771699159691522,
"max": 0.016487775863264505,
"count": 38
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.21476791614744195,
"min": 0.002310320890759898,
"max": 0.21476791614744195,
"count": 38
},
"Pyramids.Policy.LearningRate.mean": {
"value": 0.00018746620893984764,
"min": 0.00018746620893984764,
"max": 0.0002984035255321583,
"count": 38
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.002624526925157867,
"min": 0.0023872282042572664,
"max": 0.0039274579908473665,
"count": 38
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.1624887238095238,
"min": 0.1624887238095238,
"max": 0.19946784166666667,
"count": 38
},
"Pyramids.Policy.Epsilon.sum": {
"value": 2.2748421333333333,
"min": 1.5957427333333334,
"max": 2.709152633333334,
"count": 38
},
"Pyramids.Policy.Beta.mean": {
"value": 0.0062526235085714294,
"min": 0.0062526235085714294,
"max": 0.0099468373825,
"count": 38
},
"Pyramids.Policy.Beta.sum": {
"value": 0.08753672912000002,
"min": 0.07957469906,
"max": 0.13092434807000003,
"count": 38
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.007184040267020464,
"min": 0.006830547470599413,
"max": 0.5138049721717834,
"count": 38
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.10057656466960907,
"min": 0.09562766551971436,
"max": 4.110439777374268,
"count": 38
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 377.5243902439024,
"min": 377.15384615384613,
"max": 999.0,
"count": 38
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 30957.0,
"min": 16829.0,
"max": 33338.0,
"count": 38
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.5004975409587709,
"min": -0.9998645681527353,
"max": 1.5202461353097207,
"count": 38
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 123.04079835861921,
"min": -30.995801612734795,
"max": 123.04079835861921,
"count": 38
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.5004975409587709,
"min": -0.9998645681527353,
"max": 1.5202461353097207,
"count": 38
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 123.04079835861921,
"min": -30.995801612734795,
"max": 123.04079835861921,
"count": 38
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.028667418900934025,
"min": 0.028667418900934025,
"max": 11.179093125988455,
"count": 38
},
"Pyramids.Policy.RndReward.sum": {
"value": 2.35072834987659,
"min": 2.060942495649215,
"max": 190.04458314180374,
"count": 38
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 38
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 38
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1749370516",
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "1.2.0.dev0",
"mlagents_envs_version": "1.2.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.7.1+cu126",
"numpy_version": "1.23.5",
"end_time_seconds": "1749373063"
},
"total": 2547.045255888,
"count": 1,
"self": 0.5769756640006563,
"children": {
"run_training.setup": {
"total": 0.02166395300014301,
"count": 1,
"self": 0.02166395300014301
},
"TrainerController.start_learning": {
"total": 2546.4466162709996,
"count": 1,
"self": 1.5921405469612182,
"children": {
"TrainerController._reset_env": {
"total": 2.2480135420000806,
"count": 1,
"self": 2.2480135420000806
},
"TrainerController.advance": {
"total": 2542.3611137560397,
"count": 73564,
"self": 1.658556076019977,
"children": {
"env_step": {
"total": 1745.9980852639992,
"count": 73564,
"self": 1558.3319822050498,
"children": {
"SubprocessEnvManager._take_step": {
"total": 186.72180298093986,
"count": 73564,
"self": 5.507459227936806,
"children": {
"TorchPolicy.evaluate": {
"total": 181.21434375300305,
"count": 72429,
"self": 181.21434375300305
}
}
},
"workers": {
"total": 0.944300078009519,
"count": 73564,
"self": 0.0,
"children": {
"worker_root": {
"total": 2539.0924085559723,
"count": 73564,
"is_parallel": true,
"self": 1115.5424509109469,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0032895009999265312,
"count": 1,
"is_parallel": true,
"self": 0.0009728090003591205,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0023166919995674107,
"count": 8,
"is_parallel": true,
"self": 0.0023166919995674107
}
}
},
"UnityEnvironment.step": {
"total": 0.0506185239999013,
"count": 1,
"is_parallel": true,
"self": 0.0005873399998108653,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0004933090001486562,
"count": 1,
"is_parallel": true,
"self": 0.0004933090001486562
},
"communicator.exchange": {
"total": 0.0478301680000186,
"count": 1,
"is_parallel": true,
"self": 0.0478301680000186
},
"steps_from_proto": {
"total": 0.0017077069999231753,
"count": 1,
"is_parallel": true,
"self": 0.00034873799972956476,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0013589690001936106,
"count": 8,
"is_parallel": true,
"self": 0.0013589690001936106
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1423.5499576450254,
"count": 73563,
"is_parallel": true,
"self": 37.52510681484796,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 28.12623081507263,
"count": 73563,
"is_parallel": true,
"self": 28.12623081507263
},
"communicator.exchange": {
"total": 1242.7567264091165,
"count": 73563,
"is_parallel": true,
"self": 1242.7567264091165
},
"steps_from_proto": {
"total": 115.14189360598834,
"count": 73563,
"is_parallel": true,
"self": 23.262269771694264,
"children": {
"_process_rank_one_or_two_observation": {
"total": 91.87962383429408,
"count": 588504,
"is_parallel": true,
"self": 91.87962383429408
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 794.7044724160207,
"count": 73564,
"self": 2.988573217009389,
"children": {
"process_trajectory": {
"total": 153.60908939901242,
"count": 73564,
"self": 153.39238200101204,
"children": {
"RLTrainer._checkpoint": {
"total": 0.21670739800038064,
"count": 2,
"self": 0.21670739800038064
}
}
},
"_update_policy": {
"total": 638.1068097999989,
"count": 530,
"self": 351.4865674349787,
"children": {
"TorchPPOOptimizer.update": {
"total": 286.6202423650202,
"count": 26347,
"self": 286.6202423650202
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.312999302172102e-06,
"count": 1,
"self": 1.312999302172102e-06
},
"TrainerController._save_models": {
"total": 0.24534711299929768,
"count": 1,
"self": 0.008250718999079254,
"children": {
"RLTrainer._checkpoint": {
"total": 0.23709639400021842,
"count": 1,
"self": 0.23709639400021842
}
}
}
}
}
}
}