First Push

a7b2076 verified almost 2 years ago

18.7 kB

	{
	"name": "root",
	"gauges": {
	"Pyramids.Policy.Entropy.mean": {
	"value": 0.35659268498420715,
	"min": 0.35659268498420715,
	"max": 1.4464179277420044,
	"count": 33
	},
	"Pyramids.Policy.Entropy.sum": {
	"value": 10766.24609375,
	"min": 10766.24609375,
	"max": 43878.53515625,
	"count": 33
	},
	"Pyramids.Step.mean": {
	"value": 989998.0,
	"min": 29952.0,
	"max": 989998.0,
	"count": 33
	},
	"Pyramids.Step.sum": {
	"value": 989998.0,
	"min": 29952.0,
	"max": 989998.0,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.5554537177085876,
	"min": -0.08762737363576889,
	"max": 0.5883548855781555,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
	"value": 154.4161376953125,
	"min": -21.030569076538086,
	"max": 165.91607666015625,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.mean": {
	"value": 0.07612387835979462,
	"min": -0.0440775603055954,
	"max": 0.3590862452983856,
	"count": 33
	},
	"Pyramids.Policy.RndValueEstimate.sum": {
	"value": 21.162437438964844,
	"min": -11.283855438232422,
	"max": 85.10343933105469,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.mean": {
	"value": 0.06769165315519622,
	"min": 0.06374670580167276,
	"max": 0.07148971865812183,
	"count": 33
	},
	"Pyramids.Losses.PolicyLoss.sum": {
	"value": 0.9476831441727471,
	"min": 0.5000597667509366,
	"max": 1.0687312037266299,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.mean": {
	"value": 0.012951851048412556,
	"min": 0.0004213311831797018,
	"max": 0.015387932273105712,
	"count": 33
	},
	"Pyramids.Losses.ValueLoss.sum": {
	"value": 0.18132591467777578,
	"min": 0.005477305381336123,
	"max": 0.21543105182347996,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.mean": {
	"value": 7.617418889464286e-06,
	"min": 7.617418889464286e-06,
	"max": 0.00029515063018788575,
	"count": 33
	},
	"Pyramids.Policy.LearningRate.sum": {
	"value": 0.00010664386445250001,
	"min": 0.00010664386445250001,
	"max": 0.0034930540356486995,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.mean": {
	"value": 0.10253910714285716,
	"min": 0.10253910714285716,
	"max": 0.19838354285714285,
	"count": 33
	},
	"Pyramids.Policy.Epsilon.sum": {
	"value": 1.4355475000000002,
	"min": 1.3886848,
	"max": 2.5276006000000004,
	"count": 33
	},
	"Pyramids.Policy.Beta.mean": {
	"value": 0.00026365680357142855,
	"min": 0.00026365680357142855,
	"max": 0.00983851593142857,
	"count": 33
	},
	"Pyramids.Policy.Beta.sum": {
	"value": 0.00369119525,
	"min": 0.00369119525,
	"max": 0.11644869486999998,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.mean": {
	"value": 0.012202026322484016,
	"min": 0.012049351818859577,
	"max": 0.5200421214103699,
	"count": 33
	},
	"Pyramids.Losses.RNDLoss.sum": {
	"value": 0.17082837224006653,
	"min": 0.16869091987609863,
	"max": 3.6402950286865234,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.mean": {
	"value": 350.8780487804878,
	"min": 327.14606741573033,
	"max": 999.0,
	"count": 33
	},
	"Pyramids.Environment.EpisodeLength.sum": {
	"value": 28772.0,
	"min": 15984.0,
	"max": 33322.0,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.mean": {
	"value": 1.5758268153522073,
	"min": -1.0000000521540642,
	"max": 1.6624130206587522,
	"count": 33
	},
	"Pyramids.Environment.CumulativeReward.sum": {
	"value": 129.217798858881,
	"min": -31.996801674365997,
	"max": 152.9419979006052,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.mean": {
	"value": 1.5758268153522073,
	"min": -1.0000000521540642,
	"max": 1.6624130206587522,
	"count": 33
	},
	"Pyramids.Policy.ExtrinsicReward.sum": {
	"value": 129.217798858881,
	"min": -31.996801674365997,
	"max": 152.9419979006052,
	"count": 33
	},
	"Pyramids.Policy.RndReward.mean": {
	"value": 0.04456620345391878,
	"min": 0.04192256064937722,
	"max": 11.078681353479624,
	"count": 33
	},
	"Pyramids.Policy.RndReward.sum": {
	"value": 3.65442868322134,
	"min": 3.65442868322134,
	"max": 177.25890165567398,
	"count": 33
	},
	"Pyramids.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	},
	"Pyramids.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 33
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1712944083",
	"python_version": "3.10.12 (main, Nov 20 2023, 15:14:05) [GCC 11.4.0]",
	"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.2.1+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1712946511"
	},
	"total": 2427.5327057490003,
	"count": 1,
	"self": 0.5307231530000536,
	"children": {
	"run_training.setup": {
	"total": 0.08889312700011942,
	"count": 1,
	"self": 0.08889312700011942
	},
	"TrainerController.start_learning": {
	"total": 2426.913089469,
	"count": 1,
	"self": 1.5716157070332883,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.290314542000033,
	"count": 1,
	"self": 2.290314542000033
	},
	"TrainerController.advance": {
	"total": 2422.959735101967,
	"count": 63809,
	"self": 1.6175734618341266,
	"children": {
	"env_step": {
	"total": 1766.398982187056,
	"count": 63809,
	"self": 1621.4609890211464,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 143.93898208093697,
	"count": 63809,
	"self": 5.3297580839634975,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 138.60922399697347,
	"count": 62575,
	"self": 138.60922399697347
	}
	}
	},
	"workers": {
	"total": 0.9990110849726079,
	"count": 63809,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 2421.3830879441794,
	"count": 63809,
	"is_parallel": true,
	"self": 938.3398763641949,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.002177285000016127,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006832979993305344,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0014939870006855926,
	"count": 8,
	"is_parallel": true,
	"self": 0.0014939870006855926
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.04973701400012942,
	"count": 1,
	"is_parallel": true,
	"self": 0.0006779780005672364,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0005907099998694321,
	"count": 1,
	"is_parallel": true,
	"self": 0.0005907099998694321
	},
	"communicator.exchange": {
	"total": 0.04643153300003178,
	"count": 1,
	"is_parallel": true,
	"self": 0.04643153300003178
	},
	"steps_from_proto": {
	"total": 0.0020367929996609746,
	"count": 1,
	"is_parallel": true,
	"self": 0.00043388699987190193,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0016029059997890727,
	"count": 8,
	"is_parallel": true,
	"self": 0.0016029059997890727
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 1483.0432115799845,
	"count": 63808,
	"is_parallel": true,
	"self": 38.22040997188196,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 27.009885376994134,
	"count": 63808,
	"is_parallel": true,
	"self": 27.009885376994134
	},
	"communicator.exchange": {
	"total": 1303.231241952009,
	"count": 63808,
	"is_parallel": true,
	"self": 1303.231241952009
	},
	"steps_from_proto": {
	"total": 114.58167427909939,
	"count": 63808,
	"is_parallel": true,
	"self": 23.90159641218588,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 90.6800778669135,
	"count": 510464,
	"is_parallel": true,
	"self": 90.6800778669135
	}
	}
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 654.9431794530769,
	"count": 63809,
	"self": 2.99216254615294,
	"children": {
	"process_trajectory": {
	"total": 137.06190282793023,
	"count": 63809,
	"self": 136.85910823292988,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.20279459500034136,
	"count": 2,
	"self": 0.20279459500034136
	}
	}
	},
	"_update_policy": {
	"total": 514.8891140789938,
	"count": 452,
	"self": 303.8535244889631,
	"children": {
	"TorchPPOOptimizer.update": {
	"total": 211.03558959003067,
	"count": 22809,
	"self": 211.03558959003067
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 1.038999471347779e-06,
	"count": 1,
	"self": 1.038999471347779e-06
	},
	"TrainerController._save_models": {
	"total": 0.0914230790003785,
	"count": 1,
	"self": 0.0016222490003201528,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.08980083000005834,
	"count": 1,
	"self": 0.08980083000005834
	}
	}
	}
	}
	}
	}
	}