{ "name": "root", "gauges": { "SnowballTarget.Policy.Entropy.mean": { "value": 0.8370588421821594, "min": 0.8370588421821594, "max": 2.8542063236236572, "count": 20 }, "SnowballTarget.Policy.Entropy.sum": { "value": 8001.4453125, "min": 8001.4453125, "max": 29229.92578125, "count": 20 }, "SnowballTarget.Step.mean": { "value": 199984.0, "min": 9952.0, "max": 199984.0, "count": 20 }, "SnowballTarget.Step.sum": { "value": 199984.0, "min": 9952.0, "max": 199984.0, "count": 20 }, "SnowballTarget.Policy.ExtrinsicValueEstimate.mean": { "value": 13.270687103271484, "min": 0.3743959367275238, "max": 13.270687103271484, "count": 20 }, "SnowballTarget.Policy.ExtrinsicValueEstimate.sum": { "value": 2587.783935546875, "min": 72.6328125, "max": 2680.736328125, "count": 20 }, "SnowballTarget.Environment.EpisodeLength.mean": { "value": 199.0, "min": 199.0, "max": 199.0, "count": 20 }, "SnowballTarget.Environment.EpisodeLength.sum": { "value": 8756.0, "min": 8756.0, "max": 10945.0, "count": 20 }, "SnowballTarget.Losses.PolicyLoss.mean": { "value": 0.0667861311642542, "min": 0.06408279388209956, "max": 0.07503892971376712, "count": 20 }, "SnowballTarget.Losses.PolicyLoss.sum": { "value": 0.2671445246570168, "min": 0.25633117552839824, "max": 0.35178090803092343, "count": 20 }, "SnowballTarget.Losses.ValueLoss.mean": { "value": 0.1812143017702243, "min": 0.1163729392711128, "max": 0.2750221583773108, "count": 20 }, "SnowballTarget.Losses.ValueLoss.sum": { "value": 0.7248572070808972, "min": 0.4654917570844512, "max": 1.347502407080987, "count": 20 }, "SnowballTarget.Policy.LearningRate.mean": { "value": 8.082097306000009e-06, "min": 8.082097306000009e-06, "max": 0.000291882002706, "count": 20 }, "SnowballTarget.Policy.LearningRate.sum": { "value": 3.2328389224000035e-05, "min": 3.2328389224000035e-05, "max": 0.00138516003828, "count": 20 }, "SnowballTarget.Policy.Epsilon.mean": { "value": 0.10269399999999998, "min": 0.10269399999999998, "max": 0.197294, "count": 20 }, "SnowballTarget.Policy.Epsilon.sum": { "value": 0.4107759999999999, "min": 0.4107759999999999, "max": 0.9617200000000001, "count": 20 }, "SnowballTarget.Policy.Beta.mean": { "value": 0.0001444306000000001, "min": 0.0001444306000000001, "max": 0.004864970599999999, "count": 20 }, "SnowballTarget.Policy.Beta.sum": { "value": 0.0005777224000000004, "min": 0.0005777224000000004, "max": 0.023089828, "count": 20 }, "SnowballTarget.Environment.CumulativeReward.mean": { "value": 26.431818181818183, "min": 3.477272727272727, "max": 26.431818181818183, "count": 20 }, "SnowballTarget.Environment.CumulativeReward.sum": { "value": 1163.0, "min": 153.0, "max": 1423.0, "count": 20 }, "SnowballTarget.Policy.ExtrinsicReward.mean": { "value": 26.431818181818183, "min": 3.477272727272727, "max": 26.431818181818183, "count": 20 }, "SnowballTarget.Policy.ExtrinsicReward.sum": { "value": 1163.0, "min": 153.0, "max": 1423.0, "count": 20 }, "SnowballTarget.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 20 }, "SnowballTarget.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 20 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1675610602", "python_version": "3.8.10 (default, Nov 14 2022, 12:59:47) \n[GCC 9.4.0]", "command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/SnowballTarget.yaml --env=./training-envs-executables/linux/SnowballTarget/SnowballTarget --run-id=SnowballTarget1 --no-graphics", "mlagents_version": "0.29.0.dev0", "mlagents_envs_version": "0.29.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "1.8.1+cu102", "numpy_version": "1.21.6", "end_time_seconds": "1675611067" }, "total": 465.2427168659999, "count": 1, "self": 0.38919790499994633, "children": { "run_training.setup": { "total": 0.0999602379999942, "count": 1, "self": 0.0999602379999942 }, "TrainerController.start_learning": { "total": 464.75355872299997, "count": 1, "self": 0.4810203889949207, "children": { "TrainerController._reset_env": { "total": 9.441542031999916, "count": 1, "self": 9.441542031999916 }, "TrainerController.advance": { "total": 454.7069577850052, "count": 18202, "self": 0.24432561801336306, "children": { "env_step": { "total": 454.46263216699185, "count": 18202, "self": 316.41070745497484, "children": { "SubprocessEnvManager._take_step": { "total": 137.80391107698858, "count": 18202, "self": 1.310673067992866, "children": { "TorchPolicy.evaluate": { "total": 136.49323800899572, "count": 18202, "self": 31.371554670018327, "children": { "TorchPolicy.sample_actions": { "total": 105.12168333897739, "count": 18202, "self": 105.12168333897739 } } } } }, "workers": { "total": 0.24801363502842833, "count": 18202, "self": 0.0, "children": { "worker_root": { "total": 463.6436276260017, "count": 18202, "is_parallel": true, "self": 253.07267619502204, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.009333385999980237, "count": 1, "is_parallel": true, "self": 0.004150804999994762, "children": { "_process_rank_one_or_two_observation": { "total": 0.0051825809999854755, "count": 10, "is_parallel": true, "self": 0.0051825809999854755 } } }, "UnityEnvironment.step": { "total": 0.03300163500000508, "count": 1, "is_parallel": true, "self": 0.0005004190001045572, "children": { "UnityEnvironment._generate_step_input": { "total": 0.0002917629999501514, "count": 1, "is_parallel": true, "self": 0.0002917629999501514 }, "communicator.exchange": { "total": 0.030231839999942167, "count": 1, "is_parallel": true, "self": 0.030231839999942167 }, "steps_from_proto": { "total": 0.001977613000008205, "count": 1, "is_parallel": true, "self": 0.0004754599999614584, "children": { "_process_rank_one_or_two_observation": { "total": 0.0015021530000467465, "count": 10, "is_parallel": true, "self": 0.0015021530000467465 } } } } } } }, "UnityEnvironment.step": { "total": 210.57095143097968, "count": 18201, "is_parallel": true, "self": 8.066219149960602, "children": { "UnityEnvironment._generate_step_input": { "total": 4.659429013017416, "count": 18201, "is_parallel": true, "self": 4.659429013017416 }, "communicator.exchange": { "total": 169.4974887249865, "count": 18201, "is_parallel": true, "self": 169.4974887249865 }, "steps_from_proto": { "total": 28.347814543015147, "count": 18201, "is_parallel": true, "self": 5.950530731011554, "children": { "_process_rank_one_or_two_observation": { "total": 22.397283812003593, "count": 182010, "is_parallel": true, "self": 22.397283812003593 } } } } } } } } } } } } }, "trainer_threads": { "total": 4.035200004182116e-05, "count": 1, "self": 4.035200004182116e-05, "children": { "thread_root": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "trainer_advance": { "total": 451.9709286150445, "count": 327152, "is_parallel": true, "self": 8.435361040063754, "children": { "process_trajectory": { "total": 229.3675152119805, "count": 327152, "is_parallel": true, "self": 228.62211618298, "children": { "RLTrainer._checkpoint": { "total": 0.7453990290005095, "count": 4, "is_parallel": true, "self": 0.7453990290005095 } } }, "_update_policy": { "total": 214.16805236300024, "count": 90, "is_parallel": true, "self": 64.24910758399585, "children": { "TorchPPOOptimizer.update": { "total": 149.9189447790044, "count": 7645, "is_parallel": true, "self": 149.9189447790044 } } } } } } } } }, "TrainerController._save_models": { "total": 0.12399816499987537, "count": 1, "self": 0.0009810970000216912, "children": { "RLTrainer._checkpoint": { "total": 0.12301706799985368, "count": 1, "self": 0.12301706799985368 } } } } } } }