Pyramids first push

73d01f2 verified almost 2 years ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.6509416103363037,
	"min": 0.6509416103363037,
	"max": 1.4029514789581299,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 19444.927734375,
	"min": 19444.927734375,
	"max": 42559.9375,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989879.0,
	"min": 29952.0,
	"max": 989879.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989879.0,
	"min": 29952.0,
	"max": 989879.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.3457738161087036,
	"min": -0.2010049670934677,
	"max": 0.4050307869911194,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 90.24696350097656,
	"min": -47.63817596435547,
	"max": 106.92813110351562,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 135.45318603515625,
	"min": -0.0005455068894661963,
	"max": 135.45318603515625,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 35353.28125,
	"min": -0.13746774196624756,
	"max": 35353.28125,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.07116542290618998,
	"min": 0.06388296890197255,
	"max": 0.07385484702164331,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9963159206866596,
	"min": 0.4817108204762247,
	"max": 1.0532231060913582,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 1851.6963029361907,
	"min": 0.00024384026576801846,
	"max": 1851.6963029361907,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 25923.74824110667,
	"min": 0.0025457051088406558,
	"max": 25923.74824110667,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.300640423628573e-06,
	"min": 7.300640423628573e-06,
	"max": 0.00029515063018788575,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00010220896593080002,
	"min": 0.00010220896593080002,
	"max": 0.0030219080926974003,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10243351428571427,
	"min": 0.10243351428571427,
	"max": 0.19838354285714285,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4340692,
	"min": 1.3886848,
	"max": 2.4009790000000004,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.00025310807714285725,
	"min": 0.00025310807714285725,
	"max": 0.00983851593142857,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0035435130800000017,
	"min": 0.0035435130800000017,
	"max": 0.10075952973999999,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.00783002283424139,
	"min": 0.00782970804721117,
	"max": 0.35662126541137695,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.10962032526731491,
	"min": 0.10961591452360153,
	"max": 2.4963488578796387,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 480.453125,
	"min": 432.96923076923076,
	"max": 999.0,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 30749.0,
	"min": 15984.0,
	"max": 32905.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.3007280931342393,
	"min": -1.0000000521540642,
	"max": 1.5362522881764633,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 83.24659796059132,
	"min": -32.000001668930054,
	"max": 99.85639873147011,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.3007280931342393,
	"min": -1.0000000521540642,
	"max": 1.5362522881764633,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 83.24659796059132,
	"min": -32.000001668930054,
	"max": 99.85639873147011,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.04010859162281122,
	"min": 0.03515081175047761,
	"max": 7.064080120995641,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 2.566949863859918,
	"min": 2.2848027637810446,
	"max": 113.02528193593025,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1710786859",
	"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn /content/ml-agents/config/ppo/PyramidsRND.yaml --env=/content/training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.0.0",
	"mlagents_envs_version": "1.0.0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.2.1+cu121",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1710788925"
	},
	"total": 2065.710465668,
	"count": 1,
	"self": 0.5936395920007271,
	"children": {
	"run_training.setup": {
	"total": 0.10453902899962486,
	"count": 1,
	"self": 0.10453902899962486
	},
	"TrainerController.start_learning": {
	"total": 2065.0122870469995,
	"count": 1,
	"self": 1.2720890359605619,
	"children": {
	"TrainerController._reset_env": {
	"total": 4.141118183000344,
	"count": 1,
	"self": 4.141118183000344
	},
	"TrainerController.advance": {
	"total": 2059.508407389039,
	"count": 63335,
	"self": 1.3779396110348898,
	"children": {
	"env_step": {
	"total": 1401.782214859019,
	"count": 63335,
	"self": 1273.0833209249695,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 127.91015102903384,
	"count": 63335,
	"self": 4.6484490040134006,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 123.26170202502044,
	"count": 62557,
	"self": 123.26170202502044
	}
	}
	},
	"workers": {
	"total": 0.7887429050156243,
	"count": 63335,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2060.2796150749655,
	"count": 63335,
	"is_parallel": true,
	"self": 896.9964837560178,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.005344448999949236,
	"count": 1,
	"is_parallel": true,
	"self": 0.003886063999743783,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0014583850002054533,
	"count": 8,
	"is_parallel": true,
	"self": 0.0014583850002054533
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.05039602599981663,
	"count": 1,
	"is_parallel": true,
	"self": 0.000611895000020013,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0004999789998691995,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004999789998691995
	},
	"communicator.exchange": {
	"total": 0.04751114500004405,
	"count": 1,
	"is_parallel": true,
	"self": 0.04751114500004405
	},
	"steps_from_proto": {
	"total": 0.0017730069998833642,
	"count": 1,
	"is_parallel": true,
	"self": 0.00037849700083825155,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0013945099990451126,
	"count": 8,
	"is_parallel": true,
	"self": 0.0013945099990451126
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1163.2831313189477,
	"count": 63334,
	"is_parallel": true,
	"self": 34.29297426590665,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 24.028847002978637,
	"count": 63334,
	"is_parallel": true,
	"self": 24.028847002978637
	},
	"communicator.exchange": {
	"total": 998.5090422270491,
	"count": 63334,
	"is_parallel": true,
	"self": 998.5090422270491
	},
	"steps_from_proto": {
	"total": 106.45226782301324,
	"count": 63334,
	"is_parallel": true,
	"self": 20.45399349096897,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 85.99827433204428,
	"count": 506672,
	"is_parallel": true,
	"self": 85.99827433204428
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 656.348252918985,
	"count": 63335,
	"self": 2.3225651520169777,
	"children": {
	"process_trajectory": {
	"total": 120.01191298296544,
	"count": 63335,
	"self": 119.74777153796458,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.2641414450008597,
	"count": 2,
	"self": 0.2641414450008597
	}
	}
	},
	"_update_policy": {
	"total": 534.0137747840026,
	"count": 436,
	"self": 331.4164921870338,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 202.59728259696885,
	"count": 22869,
	"self": 202.59728259696885
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 8.899996828404255e-07,
	"count": 1,
	"self": 8.899996828404255e-07
	},
	"TrainerController._save_models": {
	"total": 0.09067154900003516,
	"count": 1,
	"self": 0.0015128670002013678,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.08915868199983379,
	"count": 1,
	"self": 0.08915868199983379
	}
	}
	}
	}
	}
	}
	}