First commit, default config

9a16608 verified over 1 year ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.3393213450908661,
	"min": 0.3314994275569916,
	"max": 1.379373550415039,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 10049.3408203125,
	"min": 10008.630859375,
	"max": 39019.71875,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989933.0,
	"min": 29952.0,
	"max": 989933.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989933.0,
	"min": 29952.0,
	"max": 989933.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.6254141330718994,
	"min": -0.08404293656349182,
	"max": 0.6912244558334351,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 180.74468994140625,
	"min": -20.338390350341797,
	"max": 203.21998596191406,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.02734558656811714,
	"min": -0.02242613397538662,
	"max": 0.4648740589618683,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 7.90287446975708,
	"min": -5.9877777099609375,
	"max": 102.73716735839844,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06841825248838398,
	"min": 0.06641222656305348,
	"max": 0.07352544943484582,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9578555348373757,
	"min": 0.4401610603170662,
	"max": 1.0786804384260904,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.016256701561533624,
	"min": 0.002270949388138241,
	"max": 0.016508740748880278,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.22759382186147073,
	"min": 0.022709493881382412,
	"max": 0.2318545042265517,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.4898546462714276e-06,
	"min": 7.4898546462714276e-06,
	"max": 0.00029514240161919995,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00010485796504779999,
	"min": 0.00010485796504779999,
	"max": 0.0035089250303584,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10249658571428573,
	"min": 0.10249658571428573,
	"max": 0.19838080000000002,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4349522000000001,
	"min": 1.1902848000000001,
	"max": 2.5696416,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.0002594089128571429,
	"min": 0.0002594089128571429,
	"max": 0.009838241919999999,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.00363172478,
	"min": 0.00363172478,
	"max": 0.11698719584000002,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.01445481926202774,
	"min": 0.01445481926202774,
	"max": 0.5669408440589905,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.20236746966838837,
	"min": 0.20236746966838837,
	"max": 3.4016449451446533,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 285.0857142857143,
	"min": 273.0093457943925,
	"max": 999.0,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 29934.0,
	"min": 15984.0,
	"max": 33015.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.697030171470822,
	"min": -1.0000000521540642,
	"max": 1.7269906436450013,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 179.88519817590714,
	"min": -30.24240168184042,
	"max": 184.78799887001514,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.697030171470822,
	"min": -1.0000000521540642,
	"max": 1.7269906436450013,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 179.88519817590714,
	"min": -30.24240168184042,
	"max": 184.78799887001514,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.04323365747651858,
	"min": 0.04323365747651858,
	"max": 11.171785168349743,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 4.58276769251097,
	"min": 4.501126918883529,
	"max": 178.7485626935959,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1727570619",
	"python_version": "3.10.12 (main, Sep 11 2024, 15:47:36) [GCC 11.4.0]",
	"command_line_arguments": "venv/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids1 --no-graphics --resume",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.4.1+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1727572792"
	},
	"total": 2173.1502576000003,
	"count": 1,
	"self": 0.4818422999996983,
	"children": {
	"run_training.setup": {
	"total": 0.01389500000004773,
	"count": 1,
	"self": 0.01389500000004773
	},
	"TrainerController.start_learning": {
	"total": 2172.6545203000005,
	"count": 1,
	"self": 1.5007186000343609,
	"children": {
	"TrainerController._reset_env": {
	"total": 1.388296800000262,
	"count": 1,
	"self": 1.388296800000262
	},
	"TrainerController.advance": {
	"total": 2169.6940161999664,
	"count": 64084,
	"self": 1.4004572000094413,
	"children": {
	"env_step": {
	"total": 1451.9032732999935,
	"count": 64084,
	"self": 1339.2555544999796,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 111.717396799972,
	"count": 64084,
	"self": 4.25997569997935,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 107.45742109999264,
	"count": 62432,
	"self": 107.45742109999264
	}
	}
	},
	"workers": {
	"total": 0.9303220000419969,
	"count": 64084,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2169.356929600043,
	"count": 64084,
	"is_parallel": true,
	"self": 931.6386182001056,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0019157000001541746,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005667000004905276,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001348999999663647,
	"count": 8,
	"is_parallel": true,
	"self": 0.001348999999663647
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.03984710000031555,
	"count": 1,
	"is_parallel": true,
	"self": 0.0002482999998392188,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.00021070000002509914,
	"count": 1,
	"is_parallel": true,
	"self": 0.00021070000002509914
	},
	"communicator.exchange": {
	"total": 0.03852080000024216,
	"count": 1,
	"is_parallel": true,
	"self": 0.03852080000024216
	},
	"steps_from_proto": {
	"total": 0.0008673000002090703,
	"count": 1,
	"is_parallel": true,
	"self": 0.00026889999890045146,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0005984000013086188,
	"count": 8,
	"is_parallel": true,
	"self": 0.0005984000013086188
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1237.7183113999372,
	"count": 64083,
	"is_parallel": true,
	"self": 17.496068099939748,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 17.851628199996867,
	"count": 64083,
	"is_parallel": true,
	"self": 17.851628199996867
	},
	"communicator.exchange": {
	"total": 1148.1017410999953,
	"count": 64083,
	"is_parallel": true,
	"self": 1148.1017410999953
	},
	"steps_from_proto": {
	"total": 54.268874000005326,
	"count": 64083,
	"is_parallel": true,
	"self": 14.00552580009753,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 40.263348199907796,
	"count": 512664,
	"is_parallel": true,
	"self": 40.263348199907796
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 716.3902856999634,
	"count": 64084,
	"self": 3.2933098999124013,
	"children": {
	"process_trajectory": {
	"total": 98.82236180005157,
	"count": 64084,
	"self": 98.51106890005167,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.3112928999998985,
	"count": 2,
	"self": 0.3112928999998985
	}
	}
	},
	"_update_policy": {
	"total": 614.2746139999995,
	"count": 454,
	"self": 229.39425380004286,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 384.8803601999566,
	"count": 22755,
	"self": 384.8803601999566
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 7.999997251317836e-07,
	"count": 1,
	"self": 7.999997251317836e-07
	},
	"TrainerController._save_models": {
	"total": 0.07148789999973815,
	"count": 1,
	"self": 0.009067400000276393,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.062420499999461754,
	"count": 1,
	"self": 0.062420499999461754
	}
	}
	}
	}
	}
	}
	}