ppo-SnowballTarget / run_logs /timers.json

First Push

96ec9c6 verified about 1 month ago

19.3 kB

	{
	"name": "root",
	"gauges": {
	"SnowballTarget.Policy.Entropy.mean": {
	"value": 1.0191810131072998,
	"min": 1.0125811100006104,
	"max": 2.8851497173309326,
	"count": 100
	},
	"SnowballTarget.Policy.Entropy.sum": {
	"value": 9820.828125,
	"min": 8866.5263671875,
	"max": 41352.8515625,
	"count": 100
	},
	"SnowballTarget.Step.mean": {
	"value": 999952.0,
	"min": 9952.0,
	"max": 999952.0,
	"count": 100
	},
	"SnowballTarget.Step.sum": {
	"value": 999952.0,
	"min": 9952.0,
	"max": 999952.0,
	"count": 100
	},
	"SnowballTarget.Policy.ExtrinsicValueEstimate.mean": {
	"value": 14.220526695251465,
	"min": 0.41513773798942566,
	"max": 14.232309341430664,
	"count": 100
	},
	"SnowballTarget.Policy.ExtrinsicValueEstimate.sum": {
	"value": 1393.611572265625,
	"min": 40.26836013793945,
	"max": 1494.2806396484375,
	"count": 100
	},
	"SnowballTarget.Policy.CuriosityValueEstimate.mean": {
	"value": 0.04185193032026291,
	"min": -0.29990190267562866,
	"max": 0.06766362488269806,
	"count": 100
	},
	"SnowballTarget.Policy.CuriosityValueEstimate.sum": {
	"value": 4.101489067077637,
	"min": -29.090484619140625,
	"max": 6.643495082855225,
	"count": 100
	},
	"SnowballTarget.Environment.EpisodeLength.mean": {
	"value": 199.0,
	"min": 199.0,
	"max": 199.0,
	"count": 100
	},
	"SnowballTarget.Environment.EpisodeLength.sum": {
	"value": 8756.0,
	"min": 8756.0,
	"max": 13134.0,
	"count": 100
	},
	"SnowballTarget.Environment.CumulativeReward.mean": {
	"value": 27.622222222222224,
	"min": 3.022727272727273,
	"max": 28.295454545454547,
	"count": 100
	},
	"SnowballTarget.Environment.CumulativeReward.sum": {
	"value": 1243.0,
	"min": 133.0,
	"max": 1697.0,
	"count": 100
	},
	"SnowballTarget.Policy.ExtrinsicReward.mean": {
	"value": 27.622222222222224,
	"min": 3.022727272727273,
	"max": 28.295454545454547,
	"count": 100
	},
	"SnowballTarget.Policy.ExtrinsicReward.sum": {
	"value": 1243.0,
	"min": 133.0,
	"max": 1697.0,
	"count": 100
	},
	"SnowballTarget.Policy.CuriosityReward.mean": {
	"value": 0.08641067225899961,
	"min": 0.0,
	"max": 0.29597962292080576,
	"count": 100
	},
	"SnowballTarget.Policy.CuriosityReward.sum": {
	"value": 3.8884802516549826,
	"min": 0.0,
	"max": 13.023103408515453,
	"count": 100
	},
	"SnowballTarget.Losses.PolicyLoss.mean": {
	"value": 0.13800820862084176,
	"min": 0.10502773270744717,
	"max": 0.2210215118389125,
	"count": 100
	},
	"SnowballTarget.Losses.PolicyLoss.sum": {
	"value": 0.13800820862084176,
	"min": 0.10502773270744717,
	"max": 0.4027854288067443,
	"count": 100
	},
	"SnowballTarget.Losses.ValueLoss.mean": {
	"value": 0.08755119573889357,
	"min": 0.06235209942767114,
	"max": 0.1533522138541395,
	"count": 100
	},
	"SnowballTarget.Losses.ValueLoss.sum": {
	"value": 0.08755119573889357,
	"min": 0.06235209942767114,
	"max": 0.30033070142522,
	"count": 100
	},
	"SnowballTarget.Policy.LearningRate.mean": {
	"value": 1.4952995015999965e-06,
	"min": 1.4952995015999965e-06,
	"max": 0.00029736000087999994,
	"count": 100
	},
	"SnowballTarget.Policy.LearningRate.sum": {
	"value": 1.4952995015999965e-06,
	"min": 1.4952995015999965e-06,
	"max": 0.0005551200149599999,
	"count": 100
	},
	"SnowballTarget.Policy.Epsilon.mean": {
	"value": 0.1004984,
	"min": 0.1004984,
	"max": 0.19912000000000002,
	"count": 100
	},
	"SnowballTarget.Policy.Epsilon.sum": {
	"value": 0.1004984,
	"min": 0.1004984,
	"max": 0.38504000000000005,
	"count": 100
	},
	"SnowballTarget.Policy.Beta.mean": {
	"value": 3.487015999999995e-05,
	"min": 3.487015999999995e-05,
	"max": 0.004956088,
	"count": 100
	},
	"SnowballTarget.Policy.Beta.sum": {
	"value": 3.487015999999995e-05,
	"min": 3.487015999999995e-05,
	"max": 0.009253496,
	"count": 100
	},
	"SnowballTarget.Losses.CuriosityForwardLoss.mean": {
	"value": 0.0420269084473451,
	"min": 0.04060459949753501,
	"max": 0.3548051611040578,
	"count": 100
	},
	"SnowballTarget.Losses.CuriosityForwardLoss.sum": {
	"value": 0.0420269084473451,
	"min": 0.04060459949753501,
	"max": 0.3548051611040578,
	"count": 100
	},
	"SnowballTarget.Losses.CuriosityInverseLoss.mean": {
	"value": 0.8903695670041171,
	"min": 0.8837436121521574,
	"max": 2.870172796827374,
	"count": 100
	},
	"SnowballTarget.Losses.CuriosityInverseLoss.sum": {
	"value": 0.8903695670041171,
	"min": 0.8903695670041171,
	"max": 4.892745487617724,
	"count": 100
	},
	"SnowballTarget.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 100
	},
	"SnowballTarget.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 100
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1768629609",
	"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget_v2 --no-graphics --num-envs=4 --force",
	"mlagents_version": "1.2.0.dev0",
	"mlagents_envs_version": "1.2.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.8.0+cu128",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1768630491"
	},
	"total": 881.6892560720444,
	"count": 1,
	"self": 0.5809017717838287,
	"children": {
	"run_training.setup": {
	"total": 0.08153192698955536,
	"count": 1,
	"self": 0.08153192698955536
	},
	"TrainerController.start_learning": {
	"total": 881.026822373271,
	"count": 1,
	"self": 1.2454327493906021,
	"children": {
	"TrainerController._reset_env": {
	"total": 4.511491026729345,
	"count": 1,
	"self": 4.511491026729345
	},
	"TrainerController.advance": {
	"total": 874.9155791327357,
	"count": 85836,
	"self": 1.1708364188671112,
	"children": {
	"env_step": {
	"total": 498.63419465348125,
	"count": 85836,
	"self": 171.03251956030726,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 326.7886832021177,
	"count": 91007,
	"self": 4.9086459912359715,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 321.8800372108817,
	"count": 91007,
	"self": 321.8800372108817
	}
	}
	},
	"workers": {
	"total": 0.8129918910562992,
	"count": 85836,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 3516.008899267763,
	"count": 91004,
	"is_parallel": true,
	"self": 2077.2471702061594,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.013634655624628067,
	"count": 4,
	"is_parallel": true,
	"self": 0.0038620606064796448,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.009772595018148422,
	"count": 40,
	"is_parallel": true,
	"self": 0.009772595018148422
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.14024678990244865,
	"count": 4,
	"is_parallel": true,
	"self": 0.003130599856376648,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.001779858022928238,
	"count": 4,
	"is_parallel": true,
	"self": 0.001779858022928238
	},
	"communicator.exchange": {
	"total": 0.12624675035476685,
	"count": 4,
	"is_parallel": true,
	"self": 0.12624675035476685
	},
	"steps_from_proto": {
	"total": 0.009089581668376923,
	"count": 4,
	"is_parallel": true,
	"self": 0.0016513243317604065,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.007438257336616516,
	"count": 40,
	"is_parallel": true,
	"self": 0.007438257336616516
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1438.7617290616035,
	"count": 91000,
	"is_parallel": true,
	"self": 57.816723734140396,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 31.81670133769512,
	"count": 91000,
	"is_parallel": true,
	"self": 31.81670133769512
	},
	"communicator.exchange": {
	"total": 1182.3738483600318,
	"count": 91000,
	"is_parallel": true,
	"self": 1182.3738483600318
	},
	"steps_from_proto": {
	"total": 166.75445562973619,
	"count": 91000,
	"is_parallel": true,
	"self": 29.058784492313862,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 137.69567113742232,
	"count": 910000,
	"is_parallel": true,
	"self": 137.69567113742232
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 375.1105480603874,
	"count": 85836,
	"self": 1.6210341788828373,
	"children": {
	"process_trajectory": {
	"total": 189.18001991137862,
	"count": 85836,
	"self": 181.35321673750877,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 7.826803173869848,
	"count": 20,
	"self": 7.826803173869848
	}
	}
	},
	"_update_policy": {
	"total": 184.3094939701259,
	"count": 113,
	"self": 88.27203316241503,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 96.03746080771089,
	"count": 3729,
	"self": 96.03746080771089
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 6.92903995513916e-07,
	"count": 1,
	"self": 6.92903995513916e-07
	},
	"TrainerController._save_models": {
	"total": 0.3543187715113163,
	"count": 1,
	"self": 0.026383914053440094,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.3279348574578762,
	"count": 1,
	"self": 0.3279348574578762
	}
	}
	}
	}
	}
	}
	}