{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.327528178691864,
"min": 0.327528178691864,
"max": 1.4502936601638794,
"count": 50
},
"Pyramids.Policy.Entropy.sum": {
"value": 9951.6162109375,
"min": 9951.6162109375,
"max": 46409.3984375,
"count": 50
},
"Pyramids.Step.mean": {
"value": 1499905.0,
"min": 29912.0,
"max": 1499905.0,
"count": 50
},
"Pyramids.Step.sum": {
"value": 1499905.0,
"min": 29912.0,
"max": 1499905.0,
"count": 50
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.7862254977226257,
"min": -0.0986347645521164,
"max": 0.7862254977226257,
"count": 50
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 140.73435974121094,
"min": -11.934806823730469,
"max": 140.73435974121094,
"count": 50
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": -0.021666787564754486,
"min": -0.028470776975154877,
"max": 0.2771379351615906,
"count": 50
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": -3.878355026245117,
"min": -4.783090591430664,
"max": 33.256553649902344,
"count": 50
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06795475266324207,
"min": 0.06488773596184995,
"max": 0.0760969590461734,
"count": 50
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 0.9513665372853889,
"min": 0.4749415263652549,
"max": 1.0305533156822684,
"count": 50
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.01551100939516492,
"min": 0.0009322263464162465,
"max": 0.016503496621601946,
"count": 50
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.2171541315323089,
"min": 0.010366753799227942,
"max": 0.22684459496111442,
"count": 50
},
"Pyramids.Policy.LearningRate.mean": {
"value": 3.172570371080951e-06,
"min": 3.172570371080951e-06,
"max": 0.00029676708679192377,
"count": 50
},
"Pyramids.Policy.LearningRate.sum": {
"value": 4.441598519513331e-05,
"min": 4.441598519513331e-05,
"max": 0.0033170318943227996,
"count": 50
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10105749047619049,
"min": 0.10105749047619049,
"max": 0.19892236190476195,
"count": 50
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.4148048666666668,
"min": 1.3368084666666666,
"max": 2.5056772,
"count": 50
},
"Pyramids.Policy.Beta.mean": {
"value": 0.00011564329857142854,
"min": 0.00011564329857142854,
"max": 0.009892343954285714,
"count": 50
},
"Pyramids.Policy.Beta.sum": {
"value": 0.0016190061799999996,
"min": 0.0016190061799999996,
"max": 0.11059715228,
"count": 50
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.007556379772722721,
"min": 0.007414631079882383,
"max": 0.46072664856910706,
"count": 50
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.10578931868076324,
"min": 0.09769266843795776,
"max": 3.2250864505767822,
"count": 50
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 231.448,
"min": 231.448,
"max": 999.0,
"count": 50
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 28931.0,
"min": 15850.0,
"max": 33465.0,
"count": 50
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 1.7674719789028168,
"min": -1.0000000596046448,
"max": 1.7674719789028168,
"count": 50
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 220.9339973628521,
"min": -28.582001954317093,
"max": 225.87839779257774,
"count": 50
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 1.7674719789028168,
"min": -1.0000000596046448,
"max": 1.7674719789028168,
"count": 50
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 220.9339973628521,
"min": -28.582001954317093,
"max": 225.87839779257774,
"count": 50
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.018012536310357975,
"min": 0.018012536310357975,
"max": 7.0311954423137335,
"count": 50
},
"Pyramids.Policy.RndReward.sum": {
"value": 2.2515670387947466,
"min": 2.2515670387947466,
"max": 161.71749517321587,
"count": 50
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 50
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 50
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1673509934",
"python_version": "3.8.16 (default, Dec 7 2022, 01:12:13) \n[GCC 7.5.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids2 --no-graphics",
"mlagents_version": "0.29.0.dev0",
"mlagents_envs_version": "0.29.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.8.1+cu102",
"numpy_version": "1.21.6",
"end_time_seconds": "1673512371"
},
"total": 2436.2943086840005,
"count": 1,
"self": 0.3218447830004152,
"children": {
"run_training.setup": {
"total": 0.1023755930000334,
"count": 1,
"self": 0.1023755930000334
},
"TrainerController.start_learning": {
"total": 2435.870088308,
"count": 1,
"self": 1.630570045843342,
"children": {
"TrainerController._reset_env": {
"total": 6.004141104000155,
"count": 1,
"self": 6.004141104000155
},
"TrainerController.advance": {
"total": 2428.1481303021565,
"count": 96814,
"self": 1.7727840980787732,
"children": {
"env_step": {
"total": 1485.060660868984,
"count": 96814,
"self": 1336.6898835476986,
"children": {
"SubprocessEnvManager._take_step": {
"total": 147.30312773816877,
"count": 96814,
"self": 6.095399021332014,
"children": {
"TorchPolicy.evaluate": {
"total": 141.20772871683675,
"count": 93858,
"self": 47.62053048175494,
"children": {
"TorchPolicy.sample_actions": {
"total": 93.58719823508181,
"count": 93858,
"self": 93.58719823508181
}
}
}
}
},
"workers": {
"total": 1.0676495831166903,
"count": 96814,
"self": 0.0,
"children": {
"worker_root": {
"total": 2432.3293087098527,
"count": 96814,
"is_parallel": true,
"self": 1224.0753513419404,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.001793319999706,
"count": 1,
"is_parallel": true,
"self": 0.0006566319998455583,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0011366879998604418,
"count": 8,
"is_parallel": true,
"self": 0.0011366879998604418
}
}
},
"UnityEnvironment.step": {
"total": 0.03690019999976357,
"count": 1,
"is_parallel": true,
"self": 0.0005673259984178003,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0005458120003822842,
"count": 1,
"is_parallel": true,
"self": 0.0005458120003822842
},
"communicator.exchange": {
"total": 0.033989833000305225,
"count": 1,
"is_parallel": true,
"self": 0.033989833000305225
},
"steps_from_proto": {
"total": 0.0017972290006582625,
"count": 1,
"is_parallel": true,
"self": 0.0004644370001187781,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0013327920005394844,
"count": 8,
"is_parallel": true,
"self": 0.0013327920005394844
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1208.2539573679123,
"count": 96813,
"is_parallel": true,
"self": 24.264287808257905,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 18.58284851092958,
"count": 96813,
"is_parallel": true,
"self": 18.58284851092958
},
"communicator.exchange": {
"total": 1072.1948206297984,
"count": 96813,
"is_parallel": true,
"self": 1072.1948206297984
},
"steps_from_proto": {
"total": 93.21200041892644,
"count": 96813,
"is_parallel": true,
"self": 21.30576312638459,
"children": {
"_process_rank_one_or_two_observation": {
"total": 71.90623729254185,
"count": 774504,
"is_parallel": true,
"self": 71.90623729254185
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 941.3146853350936,
"count": 96814,
"self": 3.4799849491882924,
"children": {
"process_trajectory": {
"total": 194.82750869390202,
"count": 96814,
"self": 194.55047395990186,
"children": {
"RLTrainer._checkpoint": {
"total": 0.27703473400015355,
"count": 3,
"self": 0.27703473400015355
}
}
},
"_update_policy": {
"total": 743.0071916920033,
"count": 648,
"self": 282.6112319938966,
"children": {
"TorchPPOOptimizer.update": {
"total": 460.3959596981067,
"count": 34233,
"self": 460.3959596981067
}
}
}
}
}
}
},
"trainer_threads": {
"total": 9.509994924883358e-07,
"count": 1,
"self": 9.509994924883358e-07
},
"TrainerController._save_models": {
"total": 0.08724590500060003,
"count": 1,
"self": 0.0012740770007440005,
"children": {
"RLTrainer._checkpoint": {
"total": 0.08597182799985603,
"count": 1,
"self": 0.08597182799985603
}
}
}
}
}
}
}