basic params model

8e8e9ac verified over 1 year ago

20.1 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 1.897956371307373,
	"min": 1.897956371307373,
	"max": 3.2957069873809814,
	"count": 500
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 45672.421875,
	"min": 15056.080078125,
	"max": 111055.4921875,
	"count": 500
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 999.0,
	"min": 442.3636363636364,
	"max": 999.0,
	"count": 500
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19980.0,
	"min": 16484.0,
	"max": 26132.0,
	"count": 500
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1181.7998220046622,
	"min": 1180.786960974288,
	"max": 1199.4207269131573,
	"count": 121
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 2363.5996440093245,
	"min": 2361.573921948576,
	"max": 16738.762614794054,
	"count": 121
	},
	"SoccerTwos.Step.mean": {
	"value": 4999522.0,
	"min": 9082.0,
	"max": 4999522.0,
	"count": 500
	},
	"SoccerTwos.Step.sum": {
	"value": 4999522.0,
	"min": 9082.0,
	"max": 4999522.0,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": 2.997626143041998e-05,
	"min": -0.08423199504613876,
	"max": 0.09491100162267685,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": 0.0002997626143041998,
	"min": -0.8648865818977356,
	"max": 1.272194504737854,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": 3.87626641895622e-05,
	"min": -0.10975539684295654,
	"max": 0.09483882039785385,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": 0.000387626641895622,
	"min": -1.0975539684295654,
	"max": 1.306225061416626,
	"count": 500
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 500
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.0,
	"min": -0.5591692328453064,
	"max": 0.2917600005865097,
	"count": 500
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 0.0,
	"min": -8.891600012779236,
	"max": 4.376400008797646,
	"count": 500
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.0,
	"min": -0.5591692328453064,
	"max": 0.2917600005865097,
	"count": 500
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 0.0,
	"min": -8.891600012779236,
	"max": 4.376400008797646,
	"count": 500
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 500
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 500
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.01742762657328664,
	"min": 0.011112835831348396,
	"max": 0.022888927767053247,
	"count": 229
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.01742762657328664,
	"min": 0.011112835831348396,
	"max": 0.022888927767053247,
	"count": 229
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 7.469201908823682e-09,
	"min": 2.90180472983792e-09,
	"max": 0.012253172985704925,
	"count": 229
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 7.469201908823682e-09,
	"min": 2.90180472983792e-09,
	"max": 0.012253172985704925,
	"count": 229
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 1.5322401540155774e-08,
	"min": 7.1896608518547586e-09,
	"max": 0.006459781775871912,
	"count": 229
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 1.5322401540155774e-08,
	"min": 7.1896608518547586e-09,
	"max": 0.006459781775871912,
	"count": 229
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 229
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 0.0003,
	"min": 0.0003,
	"max": 0.0003,
	"count": 229
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.20000000000000007,
	"min": 0.2,
	"max": 0.20000000000000007,
	"count": 229
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.20000000000000007,
	"min": 0.2,
	"max": 0.20000000000000007,
	"count": 229
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 0.005000000000000001,
	"min": 0.005,
	"max": 0.005000000000000001,
	"count": 229
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 0.005000000000000001,
	"min": 0.005,
	"max": 0.005000000000000001,
	"count": 229
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1721424011",
	"python_version": "3.10.12 \| packaged by conda-forge \| (main, Jun 23 2023, 22:40:32) [GCC 12.3.0]",
	"command_line_arguments": "/home/evgenii/anaconda3/envs/hf_ai_vs_ai/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.exe --run-id=soccer_twos_basic_params --no-graphics",
	"mlagents_version": "1.1.0.dev0",
	"mlagents_envs_version": "1.1.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "2.3.1+cu121",
	"numpy_version": "1.23.5",
	"end_time_seconds": "1721429399"
	},
	"total": 5387.793256162,
	"count": 1,
	"self": 0.21909823100031645,
	"children": {
	"run_training.setup": {
	"total": 0.011307577000025049,
	"count": 1,
	"self": 0.011307577000025049
	},
	"TrainerController.start_learning": {
	"total": 5387.562850354,
	"count": 1,
	"self": 4.502430648020891,
	"children": {
	"TrainerController._reset_env": {
	"total": 2.8785338079994744,
	"count": 25,
	"self": 2.8785338079994744
	},
	"TrainerController.advance": {
	"total": 5379.98944362898,
	"count": 324401,
	"self": 4.212884191760168,
	"children": {
	"env_step": {
	"total": 4177.181727042024,
	"count": 324401,
	"self": 2938.2833763098342,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 1236.2409861891056,
	"count": 324401,
	"self": 28.466274757111933,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 1207.7747114319936,
	"count": 644568,
	"self": 1207.7747114319936
	}
	}
	},
	"workers": {
	"total": 2.6573645430842703,
	"count": 324401,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 5381.82670776112,
	"count": 324401,
	"is_parallel": true,
	"self": 2992.172604458153,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.0018104759999744147,
	"count": 2,
	"is_parallel": true,
	"self": 0.0005467709999322778,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0012637050000421368,
	"count": 8,
	"is_parallel": true,
	"self": 0.0012637050000421368
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.01722774800001048,
	"count": 1,
	"is_parallel": true,
	"self": 0.00037726199997223375,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.0003011020000087683,
	"count": 1,
	"is_parallel": true,
	"self": 0.0003011020000087683
	},
	"communicator.exchange": {
	"total": 0.015354194000025245,
	"count": 1,
	"is_parallel": true,
	"self": 0.015354194000025245
	},
	"steps_from_proto": {
	"total": 0.0011951900000042315,
	"count": 2,
	"is_parallel": true,
	"self": 0.0002418459999660172,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.0009533440000382143,
	"count": 8,
	"is_parallel": true,
	"self": 0.0009533440000382143
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 2389.6250237589657,
	"count": 324400,
	"is_parallel": true,
	"self": 125.28330025650848,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 89.37477725101326,
	"count": 324400,
	"is_parallel": true,
	"self": 89.37477725101326
	},
	"communicator.exchange": {
	"total": 1785.418480443851,
	"count": 324400,
	"is_parallel": true,
	"self": 1785.418480443851
	},
	"steps_from_proto": {
	"total": 389.54846580759283,
	"count": 648800,
	"is_parallel": true,
	"self": 75.22799380102413,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 314.3204720065687,
	"count": 2595200,
	"is_parallel": true,
	"self": 314.3204720065687
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 0.029079544001660906,
	"count": 48,
	"is_parallel": true,
	"self": 0.005771209000499766,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.02330833500116114,
	"count": 192,
	"is_parallel": true,
	"self": 0.02330833500116114
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 1198.5948323951952,
	"count": 324401,
	"self": 38.15757732013367,
	"children": {
	"process_trajectory": {
	"total": 324.63177605606126,
	"count": 324401,
	"self": 322.6132117540615,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 2.0185643019997315,
	"count": 10,
	"self": 2.0185643019997315
	}
	}
	},
	"_update_policy": {
	"total": 835.8054790190004,
	"count": 229,
	"self": 443.5721942590023,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 392.23328475999807,
	"count": 6873,
	"self": 392.23328475999807
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 5.330002750270069e-07,
	"count": 1,
	"self": 5.330002750270069e-07
	},
	"TrainerController._save_models": {
	"total": 0.19244173599963688,
	"count": 1,
	"self": 0.0009216989992637536,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.19152003700037312,
	"count": 1,
	"self": 0.19152003700037312
	}
	}
	}
	}
	}
	}
	}