No defaults - 160M

49851fb over 2 years ago

20.3 kB

	{
	"name": "root",
	"gauges": {
	"SoccerTwos.Policy.Entropy.mean": {
	"value": 0.29271167516708374,
	"min": 0.27912601828575134,
	"max": 3.2958128452301025,
	"count": 15999
	},
	"SoccerTwos.Policy.Entropy.sum": {
	"value": 11614.798828125,
	"min": 4629.82958984375,
	"max": 591558.875,
	"count": 15999
	},
	"SoccerTwos.Environment.EpisodeLength.mean": {
	"value": 36.792307692307695,
	"min": 29.23170731707317,
	"max": 551.0,
	"count": 15999
	},
	"SoccerTwos.Environment.EpisodeLength.sum": {
	"value": 19132.0,
	"min": 15260.0,
	"max": 41060.0,
	"count": 15999
	},
	"SoccerTwos.Self-play.ELO.mean": {
	"value": 1639.9359347156194,
	"min": 1198.128538137423,
	"max": 1680.737096359153,
	"count": 15999
	},
	"SoccerTwos.Self-play.ELO.sum": {
	"value": 426383.343026061,
	"min": 2397.64453146509,
	"max": 500426.5231898225,
	"count": 15999
	},
	"SoccerTwos.Step.mean": {
	"value": 159999996.0,
	"min": 9568.0,
	"max": 159999996.0,
	"count": 16000
	},
	"SoccerTwos.Step.sum": {
	"value": 159999996.0,
	"min": 9568.0,
	"max": 159999996.0,
	"count": 16000
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
	"value": 0.020044520497322083,
	"min": -0.12824246287345886,
	"max": 0.22821052372455597,
	"count": 16000
	},
	"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
	"value": 5.211575508117676,
	"min": -30.2033634185791,
	"max": 49.52168273925781,
	"count": 16000
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
	"value": 0.02062523551285267,
	"min": -0.1285647302865982,
	"max": 0.22626857459545135,
	"count": 16000
	},
	"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
	"value": 5.362561225891113,
	"min": -30.095096588134766,
	"max": 49.10028076171875,
	"count": 16000
	},
	"SoccerTwos.Environment.CumulativeReward.mean": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 16000
	},
	"SoccerTwos.Environment.CumulativeReward.sum": {
	"value": 0.0,
	"min": 0.0,
	"max": 0.0,
	"count": 16000
	},
	"SoccerTwos.Policy.ExtrinsicReward.mean": {
	"value": 0.09029230796373808,
	"min": -0.46440799951553347,
	"max": 0.5237547838169595,
	"count": 16000
	},
	"SoccerTwos.Policy.ExtrinsicReward.sum": {
	"value": 23.4760000705719,
	"min": -82.58560001850128,
	"max": 93.47840017080307,
	"count": 16000
	},
	"SoccerTwos.Environment.GroupCumulativeReward.mean": {
	"value": 0.09029230796373808,
	"min": -0.46440799951553347,
	"max": 0.5237547838169595,
	"count": 16000
	},
	"SoccerTwos.Environment.GroupCumulativeReward.sum": {
	"value": 23.4760000705719,
	"min": -82.58560001850128,
	"max": 93.47840017080307,
	"count": 16000
	},
	"SoccerTwos.IsTraining.mean": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 16000
	},
	"SoccerTwos.IsTraining.sum": {
	"value": 1.0,
	"min": 1.0,
	"max": 1.0,
	"count": 16000
	},
	"SoccerTwos.Losses.PolicyLoss.mean": {
	"value": 0.012796422930356736,
	"min": 0.00885343154077418,
	"max": 0.028058637352660298,
	"count": 7774
	},
	"SoccerTwos.Losses.PolicyLoss.sum": {
	"value": 0.012796422930356736,
	"min": 0.00885343154077418,
	"max": 0.028058637352660298,
	"count": 7774
	},
	"SoccerTwos.Losses.ValueLoss.mean": {
	"value": 0.07961924796303113,
	"min": 0.005778578342869878,
	"max": 0.0951485348244508,
	"count": 7774
	},
	"SoccerTwos.Losses.ValueLoss.sum": {
	"value": 0.07961924796303113,
	"min": 0.005778578342869878,
	"max": 0.0951485348244508,
	"count": 7774
	},
	"SoccerTwos.Losses.BaselineLoss.mean": {
	"value": 0.0797942062218984,
	"min": 0.005859525905301173,
	"max": 0.09544695367415747,
	"count": 7774
	},
	"SoccerTwos.Losses.BaselineLoss.sum": {
	"value": 0.0797942062218984,
	"min": 0.005859525905301173,
	"max": 0.09544695367415747,
	"count": 7774
	},
	"SoccerTwos.Policy.LearningRate.mean": {
	"value": 5.747498117483374e-09,
	"min": 5.747498117483374e-09,
	"max": 0.000299961435012855,
	"count": 7774
	},
	"SoccerTwos.Policy.LearningRate.sum": {
	"value": 5.747498117483374e-09,
	"min": 5.747498117483374e-09,
	"max": 0.000299961435012855,
	"count": 7774
	},
	"SoccerTwos.Policy.Epsilon.mean": {
	"value": 0.25,
	"min": 0.25,
	"max": 0.25,
	"count": 7774
	},
	"SoccerTwos.Policy.Epsilon.sum": {
	"value": 0.25,
	"min": 0.25,
	"max": 0.25,
	"count": 7774
	},
	"SoccerTwos.Policy.Beta.mean": {
	"value": 1.0188061749999443e-05,
	"min": 1.0188061749999443e-05,
	"max": 0.009998715785499998,
	"count": 7774
	},
	"SoccerTwos.Policy.Beta.sum": {
	"value": 1.0188061749999443e-05,
	"min": 1.0188061749999443e-05,
	"max": 0.009998715785499998,
	"count": 7774
	}
	},
	"metadata": {
	"timer_format_version": "0.1.0",
	"start_time_seconds": "1693767407",
	"python_version": "3.9.17 (main, Jul 5 2023, 20:41:20) \n[GCC 11.2.0]",
	"command_line_arguments": "/home/mgmeskill/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=Downstrike-160M --no-graphics --num-envs=8",
	"mlagents_version": "0.31.0.dev0",
	"mlagents_envs_version": "0.31.0.dev0",
	"communication_protocol_version": "1.5.0",
	"pytorch_version": "1.11.0+cu102",
	"numpy_version": "1.21.2",
	"end_time_seconds": "1693901136"
	},
	"total": 133728.72782940418,
	"count": 1,
	"self": 0.3201414127834141,
	"children": {
	"run_training.setup": {
	"total": 0.027171769179403782,
	"count": 1,
	"self": 0.027171769179403782
	},
	"TrainerController.start_learning": {
	"total": 133728.3805162222,
	"count": 1,
	"self": 102.86563353613019,
	"children": {
	"TrainerController._reset_env": {
	"total": 696.0709477802739,
	"count": 7947,
	"self": 696.0709477802739
	},
	"TrainerController.advance": {
	"total": 132929.13862727955,
	"count": 3507132,
	"self": 80.21517739770934,
	"children": {
	"env_step": {
	"total": 73052.17698274832,
	"count": 3507132,
	"self": 24081.407350266818,
	"children": {
	"SubprocessEnvManager._take_step": {
	"total": 48880.748980567325,
	"count": 14812115,
	"self": 1211.079614217393,
	"children": {
	"TorchPolicy.evaluate": {
	"total": 47669.66936634993,
	"count": 27112404,
	"self": 47669.66936634993
	}
	}
	},
	"workers": {
	"total": 90.02065191417933,
	"count": 3507132,
	"self": 0.0,
	"children": {
	"worker_root": {
	"total": 1066995.6906433739,
	"count": 14784608,
	"is_parallel": true,
	"self": 875481.2676103334,
	"children": {
	"run_training.setup": {
	"total": 0.0,
	"count": 0,
	"is_parallel": true,
	"self": 0.0,
	"children": {
	"steps_from_proto": {
	"total": 0.01907126046717167,
	"count": 16,
	"is_parallel": true,
	"self": 0.004095900803804398,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.014975359663367271,
	"count": 64,
	"is_parallel": true,
	"self": 0.014975359663367271
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 0.17750767897814512,
	"count": 8,
	"is_parallel": true,
	"self": 0.006570951547473669,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 0.004816613160073757,
	"count": 8,
	"is_parallel": true,
	"self": 0.004816613160073757
	},
	"communicator.exchange": {
	"total": 0.14813531283289194,
	"count": 8,
	"is_parallel": true,
	"self": 0.14813531283289194
	},
	"steps_from_proto": {
	"total": 0.017984801437705755,
	"count": 16,
	"is_parallel": true,
	"self": 0.0031336508691310883,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 0.014851150568574667,
	"count": 64,
	"is_parallel": true,
	"self": 0.014851150568574667
	}
	}
	}
	}
	}
	}
	},
	"UnityEnvironment.step": {
	"total": 191352.52964038588,
	"count": 14784600,
	"is_parallel": true,
	"self": 12493.37244902039,
	"children": {
	"UnityEnvironment._generate_step_input": {
	"total": 8003.242103095632,
	"count": 14784600,
	"is_parallel": true,
	"self": 8003.242103095632
	},
	"communicator.exchange": {
	"total": 137369.81809696788,
	"count": 14784600,
	"is_parallel": true,
	"self": 137369.81809696788
	},
	"steps_from_proto": {
	"total": 33486.09699130198,
	"count": 29569200,
	"is_parallel": true,
	"self": 5620.8086648634635,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 27865.288326438516,
	"count": 118276800,
	"is_parallel": true,
	"self": 27865.288326438516
	}
	}
	}
	}
	},
	"steps_from_proto": {
	"total": 161.89339265460148,
	"count": 127136,
	"is_parallel": true,
	"self": 25.868383669760078,
	"children": {
	"_process_rank_one_or_two_observation": {
	"total": 136.0250089848414,
	"count": 508544,
	"is_parallel": true,
	"self": 136.0250089848414
	}
	}
	}
	}
	}
	}
	}
	}
	},
	"trainer_advance": {
	"total": 59796.74646713352,
	"count": 3507132,
	"self": 1285.6652827882208,
	"children": {
	"process_trajectory": {
	"total": 24676.622614394873,
	"count": 3507132,
	"self": 24650.985279567074,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 25.63733482779935,
	"count": 80,
	"self": 25.63733482779935
	}
	}
	},
	"_update_policy": {
	"total": 33834.458569950424,
	"count": 7774,
	"self": 18988.026603292674,
	"children": {
	"TorchPOCAOptimizer.update": {
	"total": 14846.43196665775,
	"count": 233220,
	"self": 14846.43196665775
	}
	}
	}
	}
	}
	}
	},
	"trainer_threads": {
	"total": 5.522742867469788e-07,
	"count": 1,
	"self": 5.522742867469788e-07
	},
	"TrainerController._save_models": {
	"total": 0.30530707398429513,
	"count": 1,
	"self": 0.0019307197071611881,
	"children": {
	"RLTrainer._checkpoint": {
	"total": 0.30337635427713394,
	"count": 1,
	"self": 0.30337635427713394
	}
	}
	}
	}
	}
	}
	}