{
"name": "root",
"gauges": {
"Pyramids.Policy.Entropy.mean": {
"value": 0.4789277911186218,
"min": 0.4567798972129822,
"max": 1.493379831314087,
"count": 33
},
"Pyramids.Policy.Entropy.sum": {
"value": 14306.53125,
"min": 13710.705078125,
"max": 45303.171875,
"count": 33
},
"Pyramids.Step.mean": {
"value": 989948.0,
"min": 29952.0,
"max": 989948.0,
"count": 33
},
"Pyramids.Step.sum": {
"value": 989948.0,
"min": 29952.0,
"max": 989948.0,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.mean": {
"value": 0.156187042593956,
"min": -0.1038445234298706,
"max": 0.15641452372074127,
"count": 33
},
"Pyramids.Policy.ExtrinsicValueEstimate.sum": {
"value": 39.20294952392578,
"min": -24.982479095458984,
"max": 39.20294952392578,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.mean": {
"value": 0.0020229294896125793,
"min": 0.0020229294896125793,
"max": 0.3120591640472412,
"count": 33
},
"Pyramids.Policy.RndValueEstimate.sum": {
"value": 0.5077552795410156,
"min": 0.5077552795410156,
"max": 73.95802307128906,
"count": 33
},
"Pyramids.Losses.PolicyLoss.mean": {
"value": 0.06981141406074896,
"min": 0.06482777008981509,
"max": 0.07376855688787709,
"count": 33
},
"Pyramids.Losses.PolicyLoss.sum": {
"value": 1.0471712109112346,
"min": 0.476110151833413,
"max": 1.0471712109112346,
"count": 33
},
"Pyramids.Losses.ValueLoss.mean": {
"value": 0.011120647125324085,
"min": 0.0007657034386159787,
"max": 0.011120647125324085,
"count": 33
},
"Pyramids.Losses.ValueLoss.sum": {
"value": 0.16680970687986127,
"min": 0.007609752863259176,
"max": 0.16680970687986127,
"count": 33
},
"Pyramids.Policy.LearningRate.mean": {
"value": 7.474217508626667e-06,
"min": 7.474217508626667e-06,
"max": 0.00029515063018788575,
"count": 33
},
"Pyramids.Policy.LearningRate.sum": {
"value": 0.0001121132626294,
"min": 0.0001121132626294,
"max": 0.0035072351309216997,
"count": 33
},
"Pyramids.Policy.Epsilon.mean": {
"value": 0.10249137333333334,
"min": 0.10249137333333334,
"max": 0.19838354285714285,
"count": 33
},
"Pyramids.Policy.Epsilon.sum": {
"value": 1.5373706000000003,
"min": 1.3691136000000002,
"max": 2.569078300000001,
"count": 33
},
"Pyramids.Policy.Beta.mean": {
"value": 0.000258888196,
"min": 0.000258888196,
"max": 0.00983851593142857,
"count": 33
},
"Pyramids.Policy.Beta.sum": {
"value": 0.00388332294,
"min": 0.00388332294,
"max": 0.11693092217,
"count": 33
},
"Pyramids.Losses.RNDLoss.mean": {
"value": 0.013961868360638618,
"min": 0.013948006555438042,
"max": 0.44069403409957886,
"count": 33
},
"Pyramids.Losses.RNDLoss.sum": {
"value": 0.20942802727222443,
"min": 0.19527208805084229,
"max": 3.0848581790924072,
"count": 33
},
"Pyramids.Environment.EpisodeLength.mean": {
"value": 665.7173913043479,
"min": 665.7173913043479,
"max": 999.0,
"count": 33
},
"Pyramids.Environment.EpisodeLength.sum": {
"value": 30623.0,
"min": 15984.0,
"max": 32336.0,
"count": 33
},
"Pyramids.Environment.CumulativeReward.mean": {
"value": 0.812365185469389,
"min": -1.0000000521540642,
"max": 0.812365185469389,
"count": 33
},
"Pyramids.Environment.CumulativeReward.sum": {
"value": 37.36879853159189,
"min": -32.000001668930054,
"max": 37.36879853159189,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.mean": {
"value": 0.812365185469389,
"min": -1.0000000521540642,
"max": 0.812365185469389,
"count": 33
},
"Pyramids.Policy.ExtrinsicReward.sum": {
"value": 37.36879853159189,
"min": -32.000001668930054,
"max": 37.36879853159189,
"count": 33
},
"Pyramids.Policy.RndReward.mean": {
"value": 0.09475868726250432,
"min": 0.09475868726250432,
"max": 9.12141172029078,
"count": 33
},
"Pyramids.Policy.RndReward.sum": {
"value": 4.358899614075199,
"min": 4.132417161308695,
"max": 145.94258752465248,
"count": 33
},
"Pyramids.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
},
"Pyramids.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 33
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1743513556",
"python_version": "3.10.12 (main, Jul 5 2023, 18:54:27) [GCC 11.2.0]",
"command_line_arguments": "/usr/local/bin/mlagents-learn ./config/ppo/PyramidsRND.yaml --env=./training-envs-executables/linux/Pyramids/Pyramids --run-id=Pyramids Training --no-graphics",
"mlagents_version": "1.2.0.dev0",
"mlagents_envs_version": "1.2.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "2.6.0+cu124",
"numpy_version": "1.23.5",
"end_time_seconds": "1743515546"
},
"total": 1989.6591349689998,
"count": 1,
"self": 0.7427212159996088,
"children": {
"run_training.setup": {
"total": 0.037944934999984525,
"count": 1,
"self": 0.037944934999984525
},
"TrainerController.start_learning": {
"total": 1988.878468818,
"count": 1,
"self": 1.2708240650110838,
"children": {
"TrainerController._reset_env": {
"total": 3.829117714000006,
"count": 1,
"self": 3.829117714000006
},
"TrainerController.advance": {
"total": 1983.6834362239888,
"count": 63244,
"self": 1.3471865479989447,
"children": {
"env_step": {
"total": 1313.056961843982,
"count": 63244,
"self": 1166.41025271399,
"children": {
"SubprocessEnvManager._take_step": {
"total": 145.9260778480134,
"count": 63244,
"self": 4.418740220968857,
"children": {
"TorchPolicy.evaluate": {
"total": 141.50733762704454,
"count": 62568,
"self": 141.50733762704454
}
}
},
"workers": {
"total": 0.7206312819784557,
"count": 63244,
"self": 0.0,
"children": {
"worker_root": {
"total": 1984.4947825860197,
"count": 63244,
"is_parallel": true,
"self": 922.2681450270554,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0053213600000390215,
"count": 1,
"is_parallel": true,
"self": 0.0035178290001454116,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.00180353099989361,
"count": 8,
"is_parallel": true,
"self": 0.00180353099989361
}
}
},
"UnityEnvironment.step": {
"total": 0.048582285999998476,
"count": 1,
"is_parallel": true,
"self": 0.0005956889999652049,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.00046176199998626544,
"count": 1,
"is_parallel": true,
"self": 0.00046176199998626544
},
"communicator.exchange": {
"total": 0.045807532000026185,
"count": 1,
"is_parallel": true,
"self": 0.045807532000026185
},
"steps_from_proto": {
"total": 0.00171730300002082,
"count": 1,
"is_parallel": true,
"self": 0.0004950490001078833,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0012222539999129367,
"count": 8,
"is_parallel": true,
"self": 0.0012222539999129367
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 1062.2266375589643,
"count": 63243,
"is_parallel": true,
"self": 31.41921442998455,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 22.381173736999415,
"count": 63243,
"is_parallel": true,
"self": 22.381173736999415
},
"communicator.exchange": {
"total": 916.7867777569652,
"count": 63243,
"is_parallel": true,
"self": 916.7867777569652
},
"steps_from_proto": {
"total": 91.63947163501496,
"count": 63243,
"is_parallel": true,
"self": 17.98900764903209,
"children": {
"_process_rank_one_or_two_observation": {
"total": 73.65046398598287,
"count": 505944,
"is_parallel": true,
"self": 73.65046398598287
}
}
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 669.2792878320079,
"count": 63244,
"self": 2.374071500027526,
"children": {
"process_trajectory": {
"total": 123.44113914997854,
"count": 63244,
"self": 123.1559100419787,
"children": {
"RLTrainer._checkpoint": {
"total": 0.28522910799983947,
"count": 2,
"self": 0.28522910799983947
}
}
},
"_update_policy": {
"total": 543.4640771820018,
"count": 444,
"self": 300.30302516500745,
"children": {
"TorchPPOOptimizer.update": {
"total": 243.16105201699435,
"count": 22809,
"self": 243.16105201699435
}
}
}
}
}
}
},
"trainer_threads": {
"total": 8.780002644925844e-07,
"count": 1,
"self": 8.780002644925844e-07
},
"TrainerController._save_models": {
"total": 0.09508993700001156,
"count": 1,
"self": 0.0014623689999098133,
"children": {
"RLTrainer._checkpoint": {
"total": 0.09362756800010175,
"count": 1,
"self": 0.09362756800010175
}
}
}
}
}
}
}