yeounyi's picture
First Push
9023e87
{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.41059887409210205,
"min": 0.4031032621860504,
"max": 1.4772595167160034,
"count": 33
},
"Pyramids.Policy.Entropy.sum": {
"value": 12271.9794921875,
"min": 12125.345703125,
"max": 44814.14453125,
"count": 33
},
"Pyramids.Step.mean": {
"value": 989963.0,
"min": 29952.0,
"max": 989963.0,
"count": 33
},
"Pyramids.Step.sum": {
"value": 989963.0,
"min": 29952.0,
"max": 989963.0,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.15164965391159058,
"min": -0.10896016657352448,
"max": 0.15164965391159058,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 38.36736297607422,
"min": -26.2593994140625,
"max": 38.36736297607422,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": -0.006919424515217543,
"min": -0.006919424515217543,
"max": 0.26137885451316833,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": -1.7506144046783447,
"min": -1.7506144046783447,
"max": 62.730926513671875,
"count": 33
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.0687537761204563,
"min": 0.06484396541452019,
"max": 0.07319275093416275,
"count": 33
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9625528656863882,
"min": 0.49531079947629986,
"max": 1.063081136517747,
"count": 33
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.00787608151501957,
"min": 0.0003182225448021127,
"max": 0.00912399763408411,
"count": 33
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.11026514121027398,
"min": 0.004455115627229578,
"max": 0.12773596687717753,
"count": 33
},
"Pyramids.Policy.LearningRate.mean": {
"value": 2.565547434550001e-06,
"min": 2.565547434550001e-06,
"max": 9.838354447360002e-05,
"count": 33
},
"Pyramids.Policy.LearningRate.sum": {
"value": 3.591766408370001e-05,
"min": 3.591766408370001e-05,
"max": 0.0010842290157711998,
"count": 33
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10256545000000002,
"min": 0.10256545000000002,
"max": 0.19838354285714285,
"count": 33
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4359163000000001,
"min": 1.3691136000000002,
"max": 2.3842288000000003,
"count": 33
},
"Pyramids.Policy.Beta.mean": {
"value": 0.00026628845500000013,
"min": 0.00026628845500000013,
"max": 0.00983851593142857,
"count": 33
},
"Pyramids.Policy.Beta.sum": {
"value": 0.0037280383700000015,
"min": 0.0037280383700000015,
"max": 0.10844445711999999,
"count": 33
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.00891942624002695,
"min": 0.00873647816479206,
"max": 0.4181419909000397,
"count": 33
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.12487196922302246,
"min": 0.12231069058179855,
"max": 2.9269938468933105,
"count": 33
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 698.0,
"min": 674.2222222222222,
"max": 999.0,
"count": 33
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 30014.0,
"min": 15984.0,
"max": 32810.0,
"count": 33
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 0.6041069467400395,
"min": -1.0000000521540642,
"max": 0.6145066372222371,
"count": 33
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 25.9765987098217,
"min": -32.000001668930054,
"max": 27.652798675000668,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 0.6041069467400395,
"min": -1.0000000521540642,
"max": 0.6145066372222371,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 25.9765987098217,
"min": -32.000001668930054,
"max": 27.652798675000668,
"count": 33
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.06433771157956704,
"min": 0.06433771157956704,
"max": 8.168297654017806,
"count": 33
},
"Pyramids.Policy.RndReward.sum": {
"value": 2.7665215979213826,
"min": 2.576814963016659,
"max": 130.6927624642849,
"count": 33
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1688542495",
"python_version": "3.10.12 (main, Jun 7 2023, 12:45:35) [GCC 9.4.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1688544470"
},
"total": 1975.006288345,
"count": 1,
"self": 0.4307719799999177,
"children": {
"run_training.setup": {
"total": 0.04151585200008867,
"count": 1,
"self": 0.04151585200008867
},
"TrainerController.start_learning": {
"total": 1974.5340005130001,
"count": 1,
"self": 1.2786678899176422,
"children": {
"TrainerController._reset_env": {
"total": 4.125409566999906,
"count": 1,
"self": 4.125409566999906
},
"TrainerController.advance": {
"total": 1969.0315315550824,
"count": 63186,
"self": 1.319476776069223,
"children": {
"env_step": {
"total": 1330.6255264789986,
"count": 63186,
"self": 1222.6821296489834,
"children": {
"SubprocessEnvManager._take_step": {
"total": 107.19564306599227,
"count": 63186,
"self": 4.565628669002649,
"children": {
"TorchPolicy.evaluate": {
"total": 102.63001439698962,
"count": 62560,
"self": 102.63001439698962
}
}
},
"workers": {
"total": 0.7477537640230594,
"count": 63186,
"self": 0.0,
"children": {
"worker_root": {
"total": 1970.2145186460261,
"count": 63186,
"is_parallel": true,
"self": 855.269954903044,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0017130789999555418,
"count": 1,
"is_parallel": true,
"self": 0.0005660990000251331,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0011469799999304087,
"count": 8,
"is_parallel": true,
"self": 0.0011469799999304087
}
}
},
"UnityEnvironment.step": {
"total": 0.05049503399993682,
"count": 1,
"is_parallel": true,
"self": 0.0005536770000844626,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.00047885300000416464,
"count": 1,
"is_parallel": true,
"self": 0.00047885300000416464
},
"communicator.exchange": {
"total": 0.04760029499993834,
"count": 1,
"is_parallel": true,
"self": 0.04760029499993834
},
"steps_from_proto": {
"total": 0.0018622089999098534,
"count": 1,
"is_parallel": true,
"self": 0.00035314099989136594,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0015090680000184875,
"count": 8,
"is_parallel": true,
"self": 0.0015090680000184875
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1114.9445637429822,
"count": 63185,
"is_parallel": true,
"self": 32.80401861406426,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 22.075887652001143,
"count": 63185,
"is_parallel": true,
"self": 22.075887652001143
},
"communicator.exchange": {
"total": 961.0932881209783,
"count": 63185,
"is_parallel": true,
"self": 961.0932881209783
},
"steps_from_proto": {
"total": 98.97136935593858,
"count": 63185,
"is_parallel": true,
"self": 18.91882208701702,
"children": {
"_process_rank_one_or_two_observation": {
"total": 80.05254726892156,
"count": 505480,
"is_parallel": true,
"self": 80.05254726892156
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 637.0865283000145,
"count": 63186,
"self": 2.335330970977566,
"children": {
"process_trajectory": {
"total": 106.39444919504047,
"count": 63186,
"self": 106.19011161304059,
"children": {
"RLTrainer._checkpoint": {
"total": 0.20433758199988006,
"count": 2,
"self": 0.20433758199988006
}
}
},
"_update_policy": {
"total": 528.3567481339965,
"count": 437,
"self": 336.5212414470078,
"children": {
"TorchPPOOptimizer.update": {
"total": 191.83550668698865,
"count": 22848,
"self": 191.83550668698865
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.1189999895577785e-06,
"count": 1,
"self": 1.1189999895577785e-06
},
"TrainerController._save_models": {
"total": 0.09839038200016148,
"count": 1,
"self": 0.0017902539998431166,
"children": {
"RLTrainer._checkpoint": {
"total": 0.09660012800031836,
"count": 1,
"self": 0.09660012800031836
}
}
}
}
}
}
}