Edison Marcecelo Muzo Oyana

basic model

2e3f5ff almost 3 years ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.4975653886795044,
	"min": 0.47961491346359253,
	"max": 1.3951681852340698,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 14847.3515625,
	"min": 14350.078125,
	"max": 42323.8203125,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989894.0,
	"min": 29952.0,
	"max": 989894.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989894.0,
	"min": 29952.0,
	"max": 989894.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.4085873067378998,
	"min": -0.08974519371986389,
	"max": 0.4677356481552124,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 108.275634765625,
	"min": -21.449100494384766,
	"max": 127.2240982055664,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.014104614965617657,
	"min": -0.005268337205052376,
	"max": 0.25343790650367737,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 3.737722873687744,
	"min": -1.4066460132598877,
	"max": 60.064781188964844,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06710505671061397,
	"min": 0.06500589805137781,
	"max": 0.07254626382824657,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9394707939485956,
	"min": 0.5075860991809736,
	"max": 1.0320246177531465,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.01582775835001793,
	"min": 0.0003489376471918086,
	"max": 0.01644820867449097,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.221588616900251,
	"min": 0.004885127060685321,
	"max": 0.24672313011736455,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.363468974114286e-06,
	"min": 7.363468974114286e-06,
	"max": 0.00029515063018788575,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.0001030885656376,
	"min": 0.0001030885656376,
	"max": 0.0036331561889480003,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10245445714285714,
	"min": 0.10245445714285714,
	"max": 0.19838354285714285,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4343624,
	"min": 1.3886848,
	"max": 2.6110519999999995,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.00025520026857142863,
	"min": 0.00025520026857142863,
	"max": 0.00983851593142857,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.003572803760000001,
	"min": 0.003572803760000001,
	"max": 0.12112409480000001,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.009822138585150242,
	"min": 0.009822138585150242,
	"max": 0.4139936566352844,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.13750994205474854,
	"min": 0.13750994205474854,
	"max": 2.8979556560516357,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 389.09859154929575,
	"min": 389.09859154929575,
	"max": 999.0,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 27626.0,
	"min": 15984.0,
	"max": 32785.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.4136591310232458,
	"min": -1.0000000521540642,
	"max": 1.5503628332700048,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 100.36979830265045,
	"min": -29.89840167760849,
	"max": 108.52539832890034,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.4136591310232458,
	"min": -1.0000000521540642,
	"max": 1.5503628332700048,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 100.36979830265045,
	"min": -29.89840167760849,
	"max": 108.52539832890034,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.03946737707309707,
	"min": 0.03946737707309707,
	"max": 8.436937988270074,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 2.802183772189892,
	"min": 2.802183772189892,
	"max": 134.9910078123212,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1679827432",
	"python_version": "3.9.16 (main, Dec 7 2022, 01:11:51) \n[GCC 9.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids-Training-01 --no-graphics",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1679829642"
	},
	"total": 2209.582941508,
	"count": 1,
	"self": 0.48784612800000104,
	"children": {
	"run_training.setup": {
	"total": 0.11024874600002477,
	"count": 1,
	"self": 0.11024874600002477
	},
	"TrainerController.start_learning": {
	"total": 2208.984846634,
	"count": 1,
	"self": 1.6394397359608774,
	"children": {
	"TrainerController._reset_env": {
	"total": 6.252175113000021,
	"count": 1,
	"self": 6.252175113000021
	},
	"TrainerController.advance": {
	"total": 2200.9970362320387,
	"count": 63574,
	"self": 1.7514847370725874,
	"children": {
	"env_step": {
	"total": 1559.8176929829783,
	"count": 63574,
	"self": 1442.1477295419309,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 116.75630156701459,
	"count": 63574,
	"self": 4.92620027300444,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 111.83010129401015,
	"count": 62556,
	"self": 111.83010129401015
	}
	}
	},
	"workers": {
	"total": 0.9136618740329823,
	"count": 63574,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2203.9800220379916,
	"count": 63574,
	"is_parallel": true,
	"self": 886.5983430489539,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.001865398000006735,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005853390000538639,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001280058999952871,
	"count": 8,
	"is_parallel": true,
	"self": 0.001280058999952871
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.08041903200000888,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005801249999421998,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0004834540000047127,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004834540000047127
	},
	"communicator.exchange": {
	"total": 0.07765766700003951,
	"count": 1,
	"is_parallel": true,
	"self": 0.07765766700003951
	},
	"steps_from_proto": {
	"total": 0.001697786000022461,
	"count": 1,
	"is_parallel": true,
	"self": 0.0004786699998930999,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.001219116000129361,
	"count": 8,
	"is_parallel": true,
	"self": 0.001219116000129361
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1317.3816789890377,
	"count": 63573,
	"is_parallel": true,
	"self": 32.843421338983035,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 23.393729668981848,
	"count": 63573,
	"is_parallel": true,
	"self": 23.393729668981848
	},
	"communicator.exchange": {
	"total": 1164.2905567070488,
	"count": 63573,
	"is_parallel": true,
	"self": 1164.2905567070488
	},
	"steps_from_proto": {
	"total": 96.85397127402388,
	"count": 63573,
	"is_parallel": true,
	"self": 20.916294354970887,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 75.93767691905299,
	"count": 508584,
	"is_parallel": true,
	"self": 75.93767691905299
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 639.427858511988,
	"count": 63574,
	"self": 2.9213153139994574,
	"children": {
	"process_trajectory": {
	"total": 119.87786565599055,
	"count": 63574,
	"self": 119.61185070899074,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.2660149469998032,
	"count": 2,
	"self": 0.2660149469998032
	}
	}
	},
	"_update_policy": {
	"total": 516.6286775419981,
	"count": 452,
	"self": 327.54881674702926,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 189.0798607949688,
	"count": 22830,
	"self": 189.0798607949688
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.0280000424245372e-06,
	"count": 1,
	"self": 1.0280000424245372e-06
	},
	"TrainerController._save_models": {
	"total": 0.09619452500010084,
	"count": 1,
	"self": 0.001404715000262513,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.09478980999983833,
	"count": 1,
	"self": 0.09478980999983833
	}
	}
	}
	}
	}
	}
	}