{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.7488517761230469,
"min": 0.6447844505310059,
"max": 1.5459904670715332,
"count": 33
},
"Pyramids.Policy.Entropy.sum": {
"value": 22393.6640625,
"min": 19271.318359375,
"max": 46899.16796875,
"count": 33
},
"Pyramids.Step.mean": {
"value": 989872.0,
"min": 29952.0,
"max": 989872.0,
"count": 33
},
"Pyramids.Step.sum": {
"value": 989872.0,
"min": 29952.0,
"max": 989872.0,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.019289691001176834,
"min": -0.10402826964855194,
"max": 0.04871964454650879,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 4.725974082946777,
"min": -24.966785430908203,
"max": 11.887593269348145,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.008578427135944366,
"min": -0.007467157207429409,
"max": 0.15129059553146362,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 2.101714611053467,
"min": -1.7697162628173828,
"max": 36.30974197387695,
"count": 33
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06973546571499975,
"min": 0.06537674973998121,
"max": 0.07336444405777964,
"count": 33
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9762965200099966,
"min": 0.49905418185082306,
"max": 1.0727976258203853,
"count": 33
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.004404868398465874,
"min": 2.3950339148027197e-05,
"max": 0.004720671249880307,
"count": 33
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.06166815757852224,
"min": 0.0003592550872204079,
"max": 0.06608939749832429,
"count": 33
},
"Pyramids.Policy.LearningRate.mean": {
"value": 7.324533272807142e-06,
"min": 7.324533272807142e-06,
"max": 0.00029515063018788575,
"count": 33
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.00010254346581929999,
"min": 0.00010254346581929999,
"max": 0.0032603807132064993,
"count": 33
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10244147857142857,
"min": 0.10244147857142857,
"max": 0.19838354285714285,
"count": 33
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4341807,
"min": 1.3691136000000002,
"max": 2.3867935000000005,
"count": 33
},
"Pyramids.Policy.Beta.mean": {
"value": 0.0002539037092857143,
"min": 0.0002539037092857143,
"max": 0.00983851593142857,
"count": 33
},
"Pyramids.Policy.Beta.sum": {
"value": 0.0035546519300000004,
"min": 0.0035546519300000004,
"max": 0.10870067065,
"count": 33
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.011813228018581867,
"min": 0.011813228018581867,
"max": 0.2889266312122345,
"count": 33
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.1653851866722107,
"min": 0.1653851866722107,
"max": 2.022486448287964,
"count": 33
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 852.3421052631579,
"min": 842.6578947368421,
"max": 999.0,
"count": 33
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 32389.0,
"min": 15984.0,
"max": 32389.0,
"count": 33
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": -0.22116319972433543,
"min": -1.0000000521540642,
"max": -0.158852681517601,
"count": 33
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": -8.404201589524746,
"min": -32.000001668930054,
"max": -6.0364018976688385,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": -0.22116319972433543,
"min": -1.0000000521540642,
"max": -0.158852681517601,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": -8.404201589524746,
"min": -32.000001668930054,
"max": -6.0364018976688385,
"count": 33
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.10468380591881118,
"min": 0.10468380591881118,
"max": 5.415352387353778,
"count": 33
},
"Pyramids.Policy.RndReward.sum": {
"value": 3.977984624914825,
"min": 3.644634314114228,
"max": 86.64563819766045,
"count": 33
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1756043291",
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "1.2.0.dev0",
"mlagents_envs_version": "1.2.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.8.0+cu128",
"numpy_version": "1.23.5",
"end_time_seconds": "1756047050"
},
"total": 3758.784336188,
"count": 1,
"self": 1.4299364990001777,
"children": {
"run_training.setup": {
"total": 0.05578594000007797,
"count": 1,
"self": 0.05578594000007797
},
"TrainerController.start_learning": {
"total": 3757.2986137489997,
"count": 1,
"self": 2.972953364021123,
"children": {
"TrainerController._reset_env": {
"total": 3.8633677860002535,
"count": 1,
"self": 3.8633677860002535
},
"TrainerController.advance": {
"total": 3750.319426425978,
"count": 63160,
"self": 3.167747282931032,
"children": {
"env_step": {
"total": 2438.8047455879855,
"count": 63160,
"self": 2228.4151067950697,
"children": {
"SubprocessEnvManager._take_step": {
"total": 208.6100466389289,
"count": 63160,
"self": 10.403559045033944,
"children": {
"TorchPolicy.evaluate": {
"total": 198.20648759389496,
"count": 62568,
"self": 198.20648759389496
}
}
},
"workers": {
"total": 1.7795921539868687,
"count": 63160,
"self": 0.0,
"children": {
"worker_root": {
"total": 3746.5845889058796,
"count": 63160,
"is_parallel": true,
"self": 1738.4553816398065,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0037214529997982027,
"count": 1,
"is_parallel": true,
"self": 0.0013413769997896452,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0023800760000085575,
"count": 8,
"is_parallel": true,
"self": 0.0023800760000085575
}
}
},
"UnityEnvironment.step": {
"total": 0.07902737299991713,
"count": 1,
"is_parallel": true,
"self": 0.0007203630002550199,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0005590229998233553,
"count": 1,
"is_parallel": true,
"self": 0.0005590229998233553
},
"communicator.exchange": {
"total": 0.07567841799982489,
"count": 1,
"is_parallel": true,
"self": 0.07567841799982489
},
"steps_from_proto": {
"total": 0.002069569000013871,
"count": 1,
"is_parallel": true,
"self": 0.0004698779998761893,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0015996910001376818,
"count": 8,
"is_parallel": true,
"self": 0.0015996910001376818
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 2008.129207266073,
"count": 63159,
"is_parallel": true,
"self": 53.55146999118733,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 34.69607676503256,
"count": 63159,
"is_parallel": true,
"self": 34.69607676503256
},
"communicator.exchange": {
"total": 1772.9666636139295,
"count": 63159,
"is_parallel": true,
"self": 1772.9666636139295
},
"steps_from_proto": {
"total": 146.91499689592365,
"count": 63159,
"is_parallel": true,
"self": 32.5446596998504,
"children": {
"_process_rank_one_or_two_observation": {
"total": 114.37033719607325,
"count": 505272,
"is_parallel": true,
"self": 114.37033719607325
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 1308.3469335550612,
"count": 63160,
"self": 5.622210516978612,
"children": {
"process_trajectory": {
"total": 200.20308955808787,
"count": 63160,
"self": 199.86270891208778,
"children": {
"RLTrainer._checkpoint": {
"total": 0.3403806460000851,
"count": 2,
"self": 0.3403806460000851
}
}
},
"_update_policy": {
"total": 1102.5216334799948,
"count": 439,
"self": 421.2265963449954,
"children": {
"TorchPPOOptimizer.update": {
"total": 681.2950371349993,
"count": 22827,
"self": 681.2950371349993
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.5539999367319979e-06,
"count": 1,
"self": 1.5539999367319979e-06
},
"TrainerController._save_models": {
"total": 0.1428646190006475,
"count": 1,
"self": 0.0066819500007113675,
"children": {
"RLTrainer._checkpoint": {
"total": 0.13618266899993614,
"count": 1,
"self": 0.13618266899993614
}
}
}
}
}
}
}