papepipopu's picture
Yo
12592be
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.1642003357410431,
"min": 0.16056354343891144,
"max": 1.4807732105255127,
"count": 100
},
"Pyramids.Policy.Entropy.sum": {
"value": 4920.755859375,
"min": 4804.06103515625,
"max": 44920.734375,
"count": 100
},
"Pyramids.Step.mean": {
"value": 2999947.0,
"min": 29952.0,
"max": 2999947.0,
"count": 100
},
"Pyramids.Step.sum": {
"value": 2999947.0,
"min": 29952.0,
"max": 2999947.0,
"count": 100
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.6865847706794739,
"min": -0.1346987932920456,
"max": 0.8179547786712646,
"count": 100
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 199.10958862304688,
"min": -32.32770919799805,
"max": 242.81996154785156,
"count": 100
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.008287320844829082,
"min": -0.04137527570128441,
"max": 0.2740214467048645,
"count": 100
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 2.403323173522949,
"min": -10.426569938659668,
"max": 65.46407318115234,
"count": 100
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06797425576951353,
"min": 0.06472775858682801,
"max": 0.07328293041290852,
"count": 100
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9516395807731896,
"min": 0.47834217100405546,
"max": 1.0798985781558956,
"count": 100
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.013280468275687391,
"min": 0.0008633737378850455,
"max": 0.015937679237963277,
"count": 100
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.18592655585962348,
"min": 0.010100517988168325,
"max": 0.2231275093314859,
"count": 100
},
"Pyramids.Policy.LearningRate.mean": {
"value": 1.4504709451142875e-06,
"min": 1.4504709451142875e-06,
"max": 0.00029838354339596195,
"count": 100
},
"Pyramids.Policy.LearningRate.sum": {
"value": 2.0306593231600025e-05,
"min": 2.0306593231600025e-05,
"max": 0.003937233687588832,
"count": 100
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10048345714285714,
"min": 0.10048345714285714,
"max": 0.19946118095238097,
"count": 100
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4067684,
"min": 1.3897045333333333,
"max": 2.812411166666667,
"count": 100
},
"Pyramids.Policy.Beta.mean": {
"value": 5.8297368571428634e-05,
"min": 5.8297368571428634e-05,
"max": 0.009946171977142856,
"count": 100
},
"Pyramids.Policy.Beta.sum": {
"value": 0.0008161631600000008,
"min": 0.0008161631600000008,
"max": 0.13125987555,
"count": 100
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.004726450890302658,
"min": 0.0044143847189843655,
"max": 0.4417647421360016,
"count": 100
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.06617031246423721,
"min": 0.06180138885974884,
"max": 3.092353105545044,
"count": 100
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 264.3644859813084,
"min": 224.79032258064515,
"max": 999.0,
"count": 100
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 28287.0,
"min": 15984.0,
"max": 32082.0,
"count": 100
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.7169420439227718,
"min": -1.0000000521540642,
"max": 1.775209667701875,
"count": 100
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 183.7127986997366,
"min": -32.000001668930054,
"max": 229.11859840154648,
"count": 100
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.7169420439227718,
"min": -1.0000000521540642,
"max": 1.775209667701875,
"count": 100
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 183.7127986997366,
"min": -32.000001668930054,
"max": 229.11859840154648,
"count": 100
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.013199198651062238,
"min": 0.010884598844797673,
"max": 9.43246571533382,
"count": 100
},
"Pyramids.Policy.RndReward.sum": {
"value": 1.4123142556636594,
"min": 1.329719188332092,
"max": 150.9194514453411,
"count": 100
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 100
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 100
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1691840274",
"python_version": "3.10.12 (main, Jun 11 2023, 05:26:28) [GCC 11.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1691847321"
},
"total": 7047.049745183001,
"count": 1,
"self": 1.0374780419997478,
"children": {
"run_training.setup": {
"total": 0.06228860799978975,
"count": 1,
"self": 0.06228860799978975
},
"TrainerController.start_learning": {
"total": 7045.949978533001,
"count": 1,
"self": 3.8242003819214005,
"children": {
"TrainerController._reset_env": {
"total": 4.370690222000121,
"count": 1,
"self": 4.370690222000121
},
"TrainerController.advance": {
"total": 7037.607241682081,
"count": 194153,
"self": 3.8922108027318245,
"children": {
"env_step": {
"total": 5075.524332072416,
"count": 194153,
"self": 4763.660695574962,
"children": {
"SubprocessEnvManager._take_step": {
"total": 309.54089548233947,
"count": 194153,
"self": 13.776553553249187,
"children": {
"TorchPolicy.evaluate": {
"total": 295.7643419290903,
"count": 187553,
"self": 295.7643419290903
}
}
},
"workers": {
"total": 2.3227410151143886,
"count": 194153,
"self": 0.0,
"children": {
"worker_root": {
"total": 7030.802261830786,
"count": 194153,
"is_parallel": true,
"self": 2605.1339650489035,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0017717289999836794,
"count": 1,
"is_parallel": true,
"self": 0.0005805659998259216,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0011911630001577578,
"count": 8,
"is_parallel": true,
"self": 0.0011911630001577578
}
}
},
"UnityEnvironment.step": {
"total": 0.04692590700005894,
"count": 1,
"is_parallel": true,
"self": 0.0005581739999342972,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.00047111300000324263,
"count": 1,
"is_parallel": true,
"self": 0.00047111300000324263
},
"communicator.exchange": {
"total": 0.044171782000148596,
"count": 1,
"is_parallel": true,
"self": 0.044171782000148596
},
"steps_from_proto": {
"total": 0.0017248379999728058,
"count": 1,
"is_parallel": true,
"self": 0.0003541170001426508,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.001370720999830155,
"count": 8,
"is_parallel": true,
"self": 0.001370720999830155
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 4425.668296781882,
"count": 194152,
"is_parallel": true,
"self": 100.78579607497795,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 66.34427626294041,
"count": 194152,
"is_parallel": true,
"self": 66.34427626294041
},
"communicator.exchange": {
"total": 3949.1558300309325,
"count": 194152,
"is_parallel": true,
"self": 3949.1558300309325
},
"steps_from_proto": {
"total": 309.382394413032,
"count": 194152,
"is_parallel": true,
"self": 59.938961736002966,
"children": {
"_process_rank_one_or_two_observation": {
"total": 249.44343267702902,
"count": 1553216,
"is_parallel": true,
"self": 249.44343267702902
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 1958.1906988069331,
"count": 194153,
"self": 7.614389938843942,
"children": {
"process_trajectory": {
"total": 335.4976165240587,
"count": 194153,
"self": 334.8579583170599,
"children": {
"RLTrainer._checkpoint": {
"total": 0.6396582069987744,
"count": 6,
"self": 0.6396582069987744
}
}
},
"_update_policy": {
"total": 1615.0786923440305,
"count": 1390,
"self": 1056.648241502924,
"children": {
"TorchPPOOptimizer.update": {
"total": 558.4304508411064,
"count": 68385,
"self": 558.4304508411064
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.4689994713990018e-06,
"count": 1,
"self": 1.4689994713990018e-06
},
"TrainerController._save_models": {
"total": 0.14784477799912565,
"count": 1,
"self": 0.001945748999787611,
"children": {
"RLTrainer._checkpoint": {
"total": 0.14589902899933804,
"count": 1,
"self": 0.14589902899933804
}
}
}
}
}
}
}