annguyen2004

First Push

7135164 verified about 1 year ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.11878236383199692,
	"min": 0.10809889435768127,
	"max": 1.2392959594726562,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 3557.769287109375,
	"min": 3248.155517578125,
	"max": 37595.28125,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989979.0,
	"min": 29952.0,
	"max": 989979.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989979.0,
	"min": 29952.0,
	"max": 989979.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": -0.0937093123793602,
	"min": -0.13980858027935028,
	"max": -0.03965657576918602,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": -22.490234375,
	"min": -33.1346321105957,
	"max": -9.517578125,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.29258492588996887,
	"min": 0.2259417027235031,
	"max": 0.48964154720306396,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 70.22038269042969,
	"min": 54.45195007324219,
	"max": 117.51396942138672,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.0701524821032039,
	"min": 0.06535336099897435,
	"max": 0.07161272738445458,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9821347494448547,
	"min": 0.5008668755187824,
	"max": 0.9821347494448547,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.0005013788562184888,
	"min": 0.000373782523542247,
	"max": 0.008696133524944761,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.007019303987058843,
	"min": 0.004859172806049211,
	"max": 0.06087293467461333,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.347826122185713e-06,
	"min": 7.347826122185713e-06,
	"max": 0.00029515063018788575,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00010286956571059998,
	"min": 0.00010286956571059998,
	"max": 0.0031375841541387,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10244924285714285,
	"min": 0.10244924285714285,
	"max": 0.19838354285714285,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4342894,
	"min": 1.3691136000000002,
	"max": 2.3458613,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.00025467936142857143,
	"min": 0.00025467936142857143,
	"max": 0.00983851593142857,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.0035655110599999997,
	"min": 0.0035655110599999997,
	"max": 0.10461154386999999,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.2888457477092743,
	"min": 0.179472878575325,
	"max": 0.5697922110557556,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 4.043840408325195,
	"min": 2.153674602508545,
	"max": 4.191043376922607,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 999.0,
	"min": 928.0,
	"max": 999.0,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 27972.0,
	"min": 15984.0,
	"max": 32726.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": -0.9996500518172979,
	"min": -1.0000000521540642,
	"max": -0.6978154314252046,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": -27.990201450884342,
	"min": -32.000001668930054,
	"max": -16.000000834465027,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": -0.9996500518172979,
	"min": -1.0000000521540642,
	"max": -0.6978154314252046,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": -27.990201450884342,
	"min": -32.000001668930054,
	"max": -16.000000834465027,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 2.846828587885414,
	"min": 1.9769958045799285,
	"max": 10.185381253249943,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 79.71120046079159,
	"min": 56.77791683236137,
	"max": 162.9661000519991,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1739006243",
	"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.2.0.dev0",
	"mlagents_envs_version": "1.2.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.6.0+cu124",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1739008490"
	},
	"total": 2246.997819224,
	"count": 1,
	"self": 0.5393444309997903,
	"children": {
	"run_training.setup": {
	"total": 0.024433104999843636,
	"count": 1,
	"self": 0.024433104999843636
	},
	"TrainerController.start_learning": {
	"total": 2246.4340416880004,
	"count": 1,
	"self": 1.5748731400240104,
	"children": {
	"TrainerController._reset_env": {
	"total": 3.960077573000035,
	"count": 1,
	"self": 3.960077573000035
	},
	"TrainerController.advance": {
	"total": 2240.8027684699764,
	"count": 62994,
	"self": 1.6008817979759442,
	"children": {
	"env_step": {
	"total": 1513.275015226022,
	"count": 62994,
	"self": 1335.5422932179872,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 176.80688636500167,
	"count": 62994,
	"self": 5.35005148505752,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 171.45683487994415,
	"count": 62540,
	"self": 171.45683487994415
	}
	}
	},
	"workers": {
	"total": 0.9258356430332242,
	"count": 62994,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2240.684774630029,
	"count": 62994,
	"is_parallel": true,
	"self": 1032.195184332002,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0068483129998639924,
	"count": 1,
	"is_parallel": true,
	"self": 0.004990184000007503,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0018581289998564898,
	"count": 8,
	"is_parallel": true,
	"self": 0.0018581289998564898
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.05441686400013168,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006464980001510412,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.000482693000094514,
	"count": 1,
	"is_parallel": true,
	"self": 0.000482693000094514
	},
	"communicator.exchange": {
	"total": 0.051234337999858326,
	"count": 1,
	"is_parallel": true,
	"self": 0.051234337999858326
	},
	"steps_from_proto": {
	"total": 0.0020533350000278006,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005514749998383195,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001501860000189481,
	"count": 8,
	"is_parallel": true,
	"self": 0.001501860000189481
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1208.489590298027,
	"count": 62993,
	"is_parallel": true,
	"self": 34.57345123904065,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 25.367545844980214,
	"count": 62993,
	"is_parallel": true,
	"self": 25.367545844980214
	},
	"communicator.exchange": {
	"total": 1042.905064199027,
	"count": 62993,
	"is_parallel": true,
	"self": 1042.905064199027
	},
	"steps_from_proto": {
	"total": 105.6435290149791,
	"count": 62993,
	"is_parallel": true,
	"self": 21.54192881193353,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 84.10160020304556,
	"count": 503944,
	"is_parallel": true,
	"self": 84.10160020304556
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 725.9268714459783,
	"count": 62994,
	"self": 2.6566088199870137,
	"children": {
	"process_trajectory": {
	"total": 139.04254404098697,
	"count": 62994,
	"self": 138.7163282629865,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.32621577800046,
	"count": 2,
	"self": 0.32621577800046
	}
	}
	},
	"_update_policy": {
	"total": 584.2277185850044,
	"count": 423,
	"self": 322.1025937070101,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 262.12512487799427,
	"count": 22842,
	"self": 262.12512487799427
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.0199996722803917e-06,
	"count": 1,
	"self": 1.0199996722803917e-06
	},
	"TrainerController._save_models": {
	"total": 0.0963214850003169,
	"count": 1,
	"self": 0.0013519990002350823,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.09496948600008182,
	"count": 1,
	"self": 0.09496948600008182
	}
	}
	}
	}
	}
	}
	}