First commit

a891092 verified 8 months ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.4484938085079193,
	"min": 0.4484938085079193,
	"max": 1.507041573524475,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 13361.52734375,
	"min": 13361.52734375,
	"max": 45717.61328125,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989890.0,
	"min": 29952.0,
	"max": 989890.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989890.0,
	"min": 29952.0,
	"max": 989890.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.24449053406715393,
	"min": -0.08303222805261612,
	"max": 0.34761524200439453,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 62.34508514404297,
	"min": -19.927734375,
	"max": 90.37995910644531,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": -1.879557490348816,
	"min": -1.9528666734695435,
	"max": 2.180330753326416,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": -479.28717041015625,
	"min": -509.6982116699219,
	"max": 566.885986328125,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.0711138052494524,
	"min": 0.06491783739918554,
	"max": 0.07402172435731044,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9955932734923337,
	"min": 0.48381534922532143,
	"max": 1.0571641896830817,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.523038732927196,
	"min": 0.00012919346758292347,
	"max": 0.523038732927196,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 7.322542260980745,
	"min": 0.0018087085461609286,
	"max": 7.322542260980745,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.289090427478574e-06,
	"min": 7.289090427478574e-06,
	"max": 0.00029515063018788575,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00010204726598470004,
	"min": 0.00010204726598470004,
	"max": 0.0032558954147015994,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10242966428571428,
	"min": 0.10242966428571428,
	"max": 0.19838354285714285,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4340152999999998,
	"min": 1.3691136000000002,
	"max": 2.4431072000000005,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.0002527234621428573,
	"min": 0.0002527234621428573,
	"max": 0.00983851593142857,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.003538128470000002,
	"min": 0.003538128470000002,
	"max": 0.10855131016000003,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.009125393815338612,
	"min": 0.009125393815338612,
	"max": 0.41734614968299866,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.12775550782680511,
	"min": 0.12775550782680511,
	"max": 2.9214229583740234,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 571.2307692307693,
	"min": 495.52542372881356,
	"max": 999.0,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 29704.0,
	"min": 15984.0,
	"max": 32747.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.0825345877271433,
	"min": -1.0000000521540642,
	"max": 1.2685573508993524,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 56.29179856181145,
	"min": -32.000001668930054,
	"max": 77.3819984048605,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.0825345877271433,
	"min": -1.0000000521540642,
	"max": 1.2685573508993524,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 56.29179856181145,
	"min": -32.000001668930054,
	"max": 77.3819984048605,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.054566108950754054,
	"min": 0.05042585650493284,
	"max": 8.928653911687434,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 2.837437665439211,
	"min": 2.837437665439211,
	"max": 142.85846258699894,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1750681963",
	"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.2.0.dev0",
	"mlagents_envs_version": "1.2.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.7.1+cu126",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1750684028"
	},
	"total": 2064.788200636,
	"count": 1,
	"self": 0.5462420210001255,
	"children": {
	"run_training.setup": {
	"total": 0.023352799999997842,
	"count": 1,
	"self": 0.023352799999997842
	},
	"TrainerController.start_learning": {
	"total": 2064.218605815,
	"count": 1,
	"self": 1.2372683429771314,
	"children": {
	"TrainerController._reset_env": {
	"total": 3.893654857999991,
	"count": 1,
	"self": 3.893654857999991
	},
	"TrainerController.advance": {
	"total": 2059.007950086023,
	"count": 63415,
	"self": 1.3015567399934298,
	"children": {
	"env_step": {
	"total": 1410.5149525910017,
	"count": 63415,
	"self": 1266.0507895819883,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 143.72092754401172,
	"count": 63415,
	"self": 4.353773891001765,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 139.36715365300995,
	"count": 62571,
	"self": 139.36715365300995
	}
	}
	},
	"workers": {
	"total": 0.7432354650015895,
	"count": 63415,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2059.430335816015,
	"count": 63415,
	"is_parallel": true,
	"self": 900.7864853950146,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.006355205999966529,
	"count": 1,
	"is_parallel": true,
	"self": 0.00448609399995803,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0018691120000084993,
	"count": 8,
	"is_parallel": true,
	"self": 0.0018691120000084993
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.046859011000037754,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005552520000264849,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0004497239999636804,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004497239999636804
	},
	"communicator.exchange": {
	"total": 0.04431933000000754,
	"count": 1,
	"is_parallel": true,
	"self": 0.04431933000000754
	},
	"steps_from_proto": {
	"total": 0.0015347050000400486,
	"count": 1,
	"is_parallel": true,
	"self": 0.0003312390000473897,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001203465999992659,
	"count": 8,
	"is_parallel": true,
	"self": 0.001203465999992659
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1158.6438504210005,
	"count": 63414,
	"is_parallel": true,
	"self": 31.204137168012494,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 21.797103267958278,
	"count": 63414,
	"is_parallel": true,
	"self": 21.797103267958278
	},
	"communicator.exchange": {
	"total": 1014.5155729170086,
	"count": 63414,
	"is_parallel": true,
	"self": 1014.5155729170086
	},
	"steps_from_proto": {
	"total": 91.12703706802108,
	"count": 63414,
	"is_parallel": true,
	"self": 17.963086770020368,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 73.16395029800071,
	"count": 507312,
	"is_parallel": true,
	"self": 73.16395029800071
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 647.1914407550277,
	"count": 63415,
	"self": 2.358597632058718,
	"children": {
	"process_trajectory": {
	"total": 121.70408041196868,
	"count": 63415,
	"self": 121.42279381996866,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.28128659200001493,
	"count": 2,
	"self": 0.28128659200001493
	}
	}
	},
	"_update_policy": {
	"total": 523.1287627110003,
	"count": 443,
	"self": 290.450171928984,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 232.67859078201627,
	"count": 22788,
	"self": 232.67859078201627
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.0579997251625173e-06,
	"count": 1,
	"self": 1.0579997251625173e-06
	},
	"TrainerController._save_models": {
	"total": 0.07973147000029712,
	"count": 1,
	"self": 0.0012926150006933312,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.07843885499960379,
	"count": 1,
	"self": 0.07843885499960379
	}
	}
	}
	}
	}
	}
	}