| { | |
| "name": "root", | |
| "gauges": { | |
| "Pyramids.Policy.Entropy.mean": { | |
| "value": 0.4158688485622406, | |
| "min": 0.4158688485622406, | |
| "max": 1.4334027767181396, | |
| "count": 38 | |
| }, | |
| "Pyramids.Policy.Entropy.sum": { | |
| "value": 12482.7197265625, | |
| "min": 12482.7197265625, | |
| "max": 43483.70703125, | |
| "count": 38 | |
| }, | |
| "Pyramids.Step.mean": { | |
| "value": 1139954.0, | |
| "min": 29902.0, | |
| "max": 1139954.0, | |
| "count": 38 | |
| }, | |
| "Pyramids.Step.sum": { | |
| "value": 1139954.0, | |
| "min": 29902.0, | |
| "max": 1139954.0, | |
| "count": 38 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.mean": { | |
| "value": 0.4747034013271332, | |
| "min": -0.09710239619016647, | |
| "max": 0.5281603932380676, | |
| "count": 38 | |
| }, | |
| "Pyramids.Policy.ExtrinsicValueEstimate.sum": { | |
| "value": 129.11932373046875, | |
| "min": -23.40167808532715, | |
| "max": 143.1314697265625, | |
| "count": 38 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.mean": { | |
| "value": 0.003889927174896002, | |
| "min": -0.0016563987592235208, | |
| "max": 0.32075613737106323, | |
| "count": 38 | |
| }, | |
| "Pyramids.Policy.RndValueEstimate.sum": { | |
| "value": 1.0580601692199707, | |
| "min": -0.4207252860069275, | |
| "max": 76.01920318603516, | |
| "count": 38 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.mean": { | |
| "value": 0.0710136718435457, | |
| "min": 0.06403720775751708, | |
| "max": 0.0738912057907631, | |
| "count": 38 | |
| }, | |
| "Pyramids.Losses.PolicyLoss.sum": { | |
| "value": 0.9941914058096398, | |
| "min": 0.5896578854585877, | |
| "max": 1.1083680868614465, | |
| "count": 38 | |
| }, | |
| "Pyramids.Losses.ValueLoss.mean": { | |
| "value": 0.015340565439102996, | |
| "min": 0.00017771699159691522, | |
| "max": 0.016487775863264505, | |
| "count": 38 | |
| }, | |
| "Pyramids.Losses.ValueLoss.sum": { | |
| "value": 0.21476791614744195, | |
| "min": 0.002310320890759898, | |
| "max": 0.21476791614744195, | |
| "count": 38 | |
| }, | |
| "Pyramids.Policy.LearningRate.mean": { | |
| "value": 0.00018746620893984764, | |
| "min": 0.00018746620893984764, | |
| "max": 0.0002984035255321583, | |
| "count": 38 | |
| }, | |
| "Pyramids.Policy.LearningRate.sum": { | |
| "value": 0.002624526925157867, | |
| "min": 0.0023872282042572664, | |
| "max": 0.0039274579908473665, | |
| "count": 38 | |
| }, | |
| "Pyramids.Policy.Epsilon.mean": { | |
| "value": 0.1624887238095238, | |
| "min": 0.1624887238095238, | |
| "max": 0.19946784166666667, | |
| "count": 38 | |
| }, | |
| "Pyramids.Policy.Epsilon.sum": { | |
| "value": 2.2748421333333333, | |
| "min": 1.5957427333333334, | |
| "max": 2.709152633333334, | |
| "count": 38 | |
| }, | |
| "Pyramids.Policy.Beta.mean": { | |
| "value": 0.0062526235085714294, | |
| "min": 0.0062526235085714294, | |
| "max": 0.0099468373825, | |
| "count": 38 | |
| }, | |
| "Pyramids.Policy.Beta.sum": { | |
| "value": 0.08753672912000002, | |
| "min": 0.07957469906, | |
| "max": 0.13092434807000003, | |
| "count": 38 | |
| }, | |
| "Pyramids.Losses.RNDLoss.mean": { | |
| "value": 0.007184040267020464, | |
| "min": 0.006830547470599413, | |
| "max": 0.5138049721717834, | |
| "count": 38 | |
| }, | |
| "Pyramids.Losses.RNDLoss.sum": { | |
| "value": 0.10057656466960907, | |
| "min": 0.09562766551971436, | |
| "max": 4.110439777374268, | |
| "count": 38 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.mean": { | |
| "value": 377.5243902439024, | |
| "min": 377.15384615384613, | |
| "max": 999.0, | |
| "count": 38 | |
| }, | |
| "Pyramids.Environment.EpisodeLength.sum": { | |
| "value": 30957.0, | |
| "min": 16829.0, | |
| "max": 33338.0, | |
| "count": 38 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.mean": { | |
| "value": 1.5004975409587709, | |
| "min": -0.9998645681527353, | |
| "max": 1.5202461353097207, | |
| "count": 38 | |
| }, | |
| "Pyramids.Environment.CumulativeReward.sum": { | |
| "value": 123.04079835861921, | |
| "min": -30.995801612734795, | |
| "max": 123.04079835861921, | |
| "count": 38 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.mean": { | |
| "value": 1.5004975409587709, | |
| "min": -0.9998645681527353, | |
| "max": 1.5202461353097207, | |
| "count": 38 | |
| }, | |
| "Pyramids.Policy.ExtrinsicReward.sum": { | |
| "value": 123.04079835861921, | |
| "min": -30.995801612734795, | |
| "max": 123.04079835861921, | |
| "count": 38 | |
| }, | |
| "Pyramids.Policy.RndReward.mean": { | |
| "value": 0.028667418900934025, | |
| "min": 0.028667418900934025, | |
| "max": 11.179093125988455, | |
| "count": 38 | |
| }, | |
| "Pyramids.Policy.RndReward.sum": { | |
| "value": 2.35072834987659, | |
| "min": 2.060942495649215, | |
| "max": 190.04458314180374, | |
| "count": 38 | |
| }, | |
| "Pyramids.IsTraining.mean": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 38 | |
| }, | |
| "Pyramids.IsTraining.sum": { | |
| "value": 1.0, | |
| "min": 1.0, | |
| "max": 1.0, | |
| "count": 38 | |
| } | |
| }, | |
| "metadata": { | |
| "timer_format_version": "0.1.0", | |
| "start_time_seconds": "1749370516", | |
| "python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]", | |
| "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics", | |
| "mlagents_version": "1.2.0.dev0", | |
| "mlagents_envs_version": "1.2.0.dev0", | |
| "communication_protocol_version": "1.5.0", | |
| "pytorch_version": "2.7.1+cu126", | |
| "numpy_version": "1.23.5", | |
| "end_time_seconds": "1749373063" | |
| }, | |
| "total": 2547.045255888, | |
| "count": 1, | |
| "self": 0.5769756640006563, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.02166395300014301, | |
| "count": 1, | |
| "self": 0.02166395300014301 | |
| }, | |
| "TrainerController.start_learning": { | |
| "total": 2546.4466162709996, | |
| "count": 1, | |
| "self": 1.5921405469612182, | |
| "children": { | |
| "TrainerController._reset_env": { | |
| "total": 2.2480135420000806, | |
| "count": 1, | |
| "self": 2.2480135420000806 | |
| }, | |
| "TrainerController.advance": { | |
| "total": 2542.3611137560397, | |
| "count": 73564, | |
| "self": 1.658556076019977, | |
| "children": { | |
| "env_step": { | |
| "total": 1745.9980852639992, | |
| "count": 73564, | |
| "self": 1558.3319822050498, | |
| "children": { | |
| "SubprocessEnvManager._take_step": { | |
| "total": 186.72180298093986, | |
| "count": 73564, | |
| "self": 5.507459227936806, | |
| "children": { | |
| "TorchPolicy.evaluate": { | |
| "total": 181.21434375300305, | |
| "count": 72429, | |
| "self": 181.21434375300305 | |
| } | |
| } | |
| }, | |
| "workers": { | |
| "total": 0.944300078009519, | |
| "count": 73564, | |
| "self": 0.0, | |
| "children": { | |
| "worker_root": { | |
| "total": 2539.0924085559723, | |
| "count": 73564, | |
| "is_parallel": true, | |
| "self": 1115.5424509109469, | |
| "children": { | |
| "run_training.setup": { | |
| "total": 0.0, | |
| "count": 0, | |
| "is_parallel": true, | |
| "self": 0.0, | |
| "children": { | |
| "steps_from_proto": { | |
| "total": 0.0032895009999265312, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0009728090003591205, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0023166919995674107, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0023166919995674107 | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 0.0506185239999013, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0005873399998108653, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 0.0004933090001486562, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0004933090001486562 | |
| }, | |
| "communicator.exchange": { | |
| "total": 0.0478301680000186, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.0478301680000186 | |
| }, | |
| "steps_from_proto": { | |
| "total": 0.0017077069999231753, | |
| "count": 1, | |
| "is_parallel": true, | |
| "self": 0.00034873799972956476, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 0.0013589690001936106, | |
| "count": 8, | |
| "is_parallel": true, | |
| "self": 0.0013589690001936106 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "UnityEnvironment.step": { | |
| "total": 1423.5499576450254, | |
| "count": 73563, | |
| "is_parallel": true, | |
| "self": 37.52510681484796, | |
| "children": { | |
| "UnityEnvironment._generate_step_input": { | |
| "total": 28.12623081507263, | |
| "count": 73563, | |
| "is_parallel": true, | |
| "self": 28.12623081507263 | |
| }, | |
| "communicator.exchange": { | |
| "total": 1242.7567264091165, | |
| "count": 73563, | |
| "is_parallel": true, | |
| "self": 1242.7567264091165 | |
| }, | |
| "steps_from_proto": { | |
| "total": 115.14189360598834, | |
| "count": 73563, | |
| "is_parallel": true, | |
| "self": 23.262269771694264, | |
| "children": { | |
| "_process_rank_one_or_two_observation": { | |
| "total": 91.87962383429408, | |
| "count": 588504, | |
| "is_parallel": true, | |
| "self": 91.87962383429408 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_advance": { | |
| "total": 794.7044724160207, | |
| "count": 73564, | |
| "self": 2.988573217009389, | |
| "children": { | |
| "process_trajectory": { | |
| "total": 153.60908939901242, | |
| "count": 73564, | |
| "self": 153.39238200101204, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.21670739800038064, | |
| "count": 2, | |
| "self": 0.21670739800038064 | |
| } | |
| } | |
| }, | |
| "_update_policy": { | |
| "total": 638.1068097999989, | |
| "count": 530, | |
| "self": 351.4865674349787, | |
| "children": { | |
| "TorchPPOOptimizer.update": { | |
| "total": 286.6202423650202, | |
| "count": 26347, | |
| "self": 286.6202423650202 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| }, | |
| "trainer_threads": { | |
| "total": 1.312999302172102e-06, | |
| "count": 1, | |
| "self": 1.312999302172102e-06 | |
| }, | |
| "TrainerController._save_models": { | |
| "total": 0.24534711299929768, | |
| "count": 1, | |
| "self": 0.008250718999079254, | |
| "children": { | |
| "RLTrainer._checkpoint": { | |
| "total": 0.23709639400021842, | |
| "count": 1, | |
| "self": 0.23709639400021842 | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } | |
| } |