{ "name": "root", "gauges": { "Pyramids.Policy.Entropy.mean": { "value": 0.14759185910224915, "min": 0.14025941491127014, "max": 0.33215630054473877, "count": 50 }, "Pyramids.Policy.Entropy.sum": { "value": 4484.43115234375, "min": 4207.7822265625, "max": 10171.9541015625, "count": 50 }, "Pyramids.Step.mean": { "value": 2999999.0, "min": 1529929.0, "max": 2999999.0, "count": 50 }, "Pyramids.Step.sum": { "value": 2999999.0, "min": 1529929.0, "max": 2999999.0, "count": 50 }, "Pyramids.Policy.ExtrinsicValueEstimate.mean": { "value": 0.7630169987678528, "min": 0.5922383666038513, "max": 0.7677894830703735, "count": 50 }, "Pyramids.Policy.ExtrinsicValueEstimate.sum": { "value": 225.0900115966797, "min": 165.23451232910156, "max": 228.03347778320312, "count": 50 }, "Pyramids.Policy.RndValueEstimate.mean": { "value": 0.015491118654608727, "min": 0.008117031306028366, "max": 0.0288896132260561, "count": 50 }, "Pyramids.Policy.RndValueEstimate.sum": { "value": 4.56988000869751, "min": 2.370173215866089, "max": 8.233539581298828, "count": 50 }, "Pyramids.Environment.EpisodeLength.mean": { "value": 242.82203389830508, "min": 222.50746268656715, "max": 325.75, "count": 50 }, "Pyramids.Environment.EpisodeLength.sum": { "value": 28653.0, "min": 26537.0, "max": 31592.0, "count": 50 }, "Pyramids.Environment.CumulativeReward.mean": { "value": 1.7571779478151919, "min": 1.586324718850915, "max": 1.777492522637346, "count": 50 }, "Pyramids.Environment.CumulativeReward.sum": { "value": 207.34699784219265, "min": 145.8119983226061, "max": 238.18399803340435, "count": 50 }, "Pyramids.Policy.ExtrinsicReward.mean": { "value": 1.7571779478151919, "min": 1.586324718850915, "max": 1.777492522637346, "count": 50 }, "Pyramids.Policy.ExtrinsicReward.sum": { "value": 207.34699784219265, "min": 145.8119983226061, "max": 238.18399803340435, "count": 50 }, "Pyramids.Policy.RndReward.mean": { "value": 0.028435185211646504, "min": 0.026604726313148128, "max": 0.06942069130084362, "count": 50 }, "Pyramids.Policy.RndReward.sum": { "value": 3.3553518549742876, "min": 3.3553518549742876, "max": 6.733807056181831, "count": 50 }, "Pyramids.Losses.PolicyLoss.mean": { "value": 0.019560502592163784, "min": 0.019560502592163784, "max": 0.0276279745134525, "count": 50 }, "Pyramids.Losses.PolicyLoss.sum": { "value": 0.05868150777649135, "min": 0.04262920394539833, "max": 0.08060212047537789, "count": 50 }, "Pyramids.Losses.ValueLoss.mean": { "value": 0.01643072345604499, "min": 0.014319621746738752, "max": 0.017897415434320767, "count": 50 }, "Pyramids.Losses.ValueLoss.sum": { "value": 0.04929217036813498, "min": 0.030501069389283656, "max": 0.0536922463029623, "count": 50 }, "Pyramids.Policy.LearningRate.mean": { "value": 1.6612994462666625e-06, "min": 1.6612994462666625e-06, "max": 0.00014845130051624998, "count": 50 }, "Pyramids.Policy.LearningRate.sum": { "value": 4.983898338799987e-06, "min": 4.983898338799987e-06, "max": 0.0004376169541277333, "count": 50 }, "Pyramids.Policy.Epsilon.mean": { "value": 0.10055373333333334, "min": 0.10055373333333334, "max": 0.14948375000000003, "count": 50 }, "Pyramids.Policy.Epsilon.sum": { "value": 0.3016612, "min": 0.2090047333333333, "max": 0.4458722666666667, "count": 50 }, "Pyramids.Policy.Beta.mean": { "value": 6.531795999999988e-05, "min": 6.531795999999988e-05, "max": 0.004953426625, "count": 50 }, "Pyramids.Policy.Beta.sum": { "value": 0.0001959538799999996, "min": 0.0001959538799999996, "max": 0.014602639439999999, "count": 50 }, "Pyramids.Losses.RNDLoss.mean": { "value": 0.011611025780439377, "min": 0.01159887108951807, "max": 0.02117346040904522, "count": 50 }, "Pyramids.Losses.RNDLoss.sum": { "value": 0.03483307734131813, "min": 0.02372013032436371, "max": 0.06352037936449051, "count": 50 }, "Pyramids.IsTraining.mean": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 50 }, "Pyramids.IsTraining.sum": { "value": 1.0, "min": 1.0, "max": 1.0, "count": 50 } }, "metadata": { "timer_format_version": "0.1.0", "start_time_seconds": "1746508706", "python_version": "3.10.12 | packaged by conda-forge | (main, Jun 23 2023, 22:40:32) [GCC 12.3.0]", "command_line_arguments": "/home/txshi/miniconda3/envs/hf-rl-ch5/bin/mlagents-learn ./ml-agents/config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics --resume", "mlagents_version": "1.2.0.dev0", "mlagents_envs_version": "1.2.0.dev0", "communication_protocol_version": "1.5.0", "pytorch_version": "2.7.0+cu126", "numpy_version": "1.23.5", "end_time_seconds": "1746509653" }, "total": 946.4430587530005, "count": 1, "self": 0.1665285330018378, "children": { "run_training.setup": { "total": 0.015372962998299045, "count": 1, "self": 0.015372962998299045 }, "TrainerController.start_learning": { "total": 946.2611572570004, "count": 1, "self": 0.7353149860136909, "children": { "TrainerController._reset_env": { "total": 1.3560721989997546, "count": 1, "self": 1.3560721989997546 }, "TrainerController.advance": { "total": 944.1236960439855, "count": 98280, "self": 0.6919071292486478, "children": { "env_step": { "total": 628.7653076611532, "count": 98280, "self": 501.679360544118, "children": { "SubprocessEnvManager._take_step": { "total": 126.59082360999855, "count": 98280, "self": 2.55443194534746, "children": { "TorchPolicy.evaluate": { "total": 124.03639166465109, "count": 93817, "self": 124.03639166465109 } } }, "workers": { "total": 0.4951235070366238, "count": 98280, "self": 0.0, "children": { "worker_root": { "total": 945.3021435918654, "count": 98280, "is_parallel": true, "self": 489.8738490467058, "children": { "run_training.setup": { "total": 0.0, "count": 0, "is_parallel": true, "self": 0.0, "children": { "steps_from_proto": { "total": 0.0006208550003066193, "count": 1, "is_parallel": true, "self": 0.0001753210017341189, "children": { "_process_rank_one_or_two_observation": { "total": 0.0004455339985725004, "count": 8, "is_parallel": true, "self": 0.0004455339985725004 } } }, "UnityEnvironment.step": { "total": 0.012712784000541433, "count": 1, "is_parallel": true, "self": 0.00012432600124157034, "children": { "UnityEnvironment._generate_step_input": { "total": 0.00013519099957193248, "count": 1, "is_parallel": true, "self": 0.00013519099957193248 }, "communicator.exchange": { "total": 0.012097856999389478, "count": 1, "is_parallel": true, "self": 0.012097856999389478 }, "steps_from_proto": { "total": 0.00035541000033845194, "count": 1, "is_parallel": true, "self": 8.841799717629328e-05, "children": { "_process_rank_one_or_two_observation": { "total": 0.00026699200316215865, "count": 8, "is_parallel": true, "self": 0.00026699200316215865 } } } } } } }, "UnityEnvironment.step": { "total": 455.4282945451596, "count": 98279, "is_parallel": true, "self": 10.6707104262332, "children": { "UnityEnvironment._generate_step_input": { "total": 6.716008393870652, "count": 98279, "is_parallel": true, "self": 6.716008393870652 }, "communicator.exchange": { "total": 409.69189717502195, "count": 98279, "is_parallel": true, "self": 409.69189717502195 }, "steps_from_proto": { "total": 28.349678550033786, "count": 98279, "is_parallel": true, "self": 6.308964319758161, "children": { "_process_rank_one_or_two_observation": { "total": 22.040714230275626, "count": 786232, "is_parallel": true, "self": 22.040714230275626 } } } } } } } } } } }, "trainer_advance": { "total": 314.6664812535837, "count": 98280, "self": 1.5202239386580914, "children": { "process_trajectory": { "total": 79.52096247990994, "count": 98280, "self": 79.37046390090836, "children": { "RLTrainer._checkpoint": { "total": 0.15049857900157804, "count": 3, "self": 0.15049857900157804 } } }, "_update_policy": { "total": 233.62529483501567, "count": 145, "self": 185.6884477689655, "children": { "TorchPPOOptimizer.update": { "total": 47.93684706605018, "count": 7250, "self": 47.93684706605018 } } } } } } }, "trainer_threads": { "total": 4.420016921358183e-07, "count": 1, "self": 4.420016921358183e-07 }, "TrainerController._save_models": { "total": 0.04607358599969302, "count": 1, "self": 0.0011363630001142155, "children": { "RLTrainer._checkpoint": { "total": 0.04493722299957881, "count": 1, "self": 0.04493722299957881 } } } } } } }