{
"name": "root",
"gauges": {
"SoccerTwos.Policy.Entropy.mean": {
"value": 1.5031105279922485,
"min": 1.4853661060333252,
"max": 3.295753240585327,
"count": 600
},
"SoccerTwos.Policy.Entropy.sum": {
"value": 30302.708984375,
"min": 15746.2822265625,
"max": 105464.1015625,
"count": 600
},
"SoccerTwos.Environment.EpisodeLength.mean": {
"value": 44.648148148148145,
"min": 38.67460317460318,
"max": 999.0,
"count": 600
},
"SoccerTwos.Environment.EpisodeLength.sum": {
"value": 19288.0,
"min": 7992.0,
"max": 28552.0,
"count": 600
},
"SoccerTwos.Self-play.ELO.mean": {
"value": 1567.3846019546936,
"min": 1189.3936508408033,
"max": 1583.8063739193924,
"count": 593
},
"SoccerTwos.Self-play.ELO.sum": {
"value": 338555.0740222138,
"min": 2390.508945079749,
"max": 384263.7276774414,
"count": 593
},
"SoccerTwos.Step.mean": {
"value": 5999832.0,
"min": 9830.0,
"max": 5999832.0,
"count": 600
},
"SoccerTwos.Step.sum": {
"value": 5999832.0,
"min": 9830.0,
"max": 5999832.0,
"count": 600
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.mean": {
"value": -0.03408787399530411,
"min": -0.10397680848836899,
"max": 0.14669004082679749,
"count": 600
},
"SoccerTwos.Policy.ExtrinsicBaselineEstimate.sum": {
"value": -7.362980842590332,
"min": -21.915634155273438,
"max": 28.4429931640625,
"count": 600
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.mean": {
"value": -0.03417100012302399,
"min": -0.10394182801246643,
"max": 0.1544579714536667,
"count": 600
},
"SoccerTwos.Policy.ExtrinsicValueEstimate.sum": {
"value": -7.3809356689453125,
"min": -22.031593322753906,
"max": 30.658737182617188,
"count": 600
},
"SoccerTwos.Environment.CumulativeReward.mean": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 600
},
"SoccerTwos.Environment.CumulativeReward.sum": {
"value": 0.0,
"min": 0.0,
"max": 0.0,
"count": 600
},
"SoccerTwos.Policy.ExtrinsicReward.mean": {
"value": 0.023190740357946465,
"min": -0.6257176469354069,
"max": 0.5128818249160593,
"count": 600
},
"SoccerTwos.Policy.ExtrinsicReward.sum": {
"value": 5.009199917316437,
"min": -61.58959984779358,
"max": 63.226799964904785,
"count": 600
},
"SoccerTwos.Environment.GroupCumulativeReward.mean": {
"value": 0.023190740357946465,
"min": -0.6257176469354069,
"max": 0.5128818249160593,
"count": 600
},
"SoccerTwos.Environment.GroupCumulativeReward.sum": {
"value": 5.009199917316437,
"min": -61.58959984779358,
"max": 63.226799964904785,
"count": 600
},
"SoccerTwos.IsTraining.mean": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 600
},
"SoccerTwos.IsTraining.sum": {
"value": 1.0,
"min": 1.0,
"max": 1.0,
"count": 600
},
"SoccerTwos.Losses.PolicyLoss.mean": {
"value": 0.01506537000774794,
"min": 0.009937849570997059,
"max": 0.02400178289390169,
"count": 289
},
"SoccerTwos.Losses.PolicyLoss.sum": {
"value": 0.01506537000774794,
"min": 0.009937849570997059,
"max": 0.02400178289390169,
"count": 289
},
"SoccerTwos.Losses.ValueLoss.mean": {
"value": 0.13020551279187204,
"min": 5.6926707899644194e-05,
"max": 0.13434325406948724,
"count": 289
},
"SoccerTwos.Losses.ValueLoss.sum": {
"value": 0.13020551279187204,
"min": 5.6926707899644194e-05,
"max": 0.13434325406948724,
"count": 289
},
"SoccerTwos.Losses.BaselineLoss.mean": {
"value": 0.1305543358127276,
"min": 6.166132200936166e-05,
"max": 0.13478971819082897,
"count": 289
},
"SoccerTwos.Losses.BaselineLoss.sum": {
"value": 0.1305543358127276,
"min": 6.166132200936166e-05,
"max": 0.13478971819082897,
"count": 289
},
"SoccerTwos.Policy.LearningRate.mean": {
"value": 7.292997569333412e-07,
"min": 7.292997569333412e-07,
"max": 0.0002986438004520667,
"count": 289
},
"SoccerTwos.Policy.LearningRate.sum": {
"value": 7.292997569333412e-07,
"min": 7.292997569333412e-07,
"max": 0.0002986438004520667,
"count": 289
},
"SoccerTwos.Policy.Epsilon.mean": {
"value": 0.10024306666666669,
"min": 0.10024306666666669,
"max": 0.19954793333333332,
"count": 289
},
"SoccerTwos.Policy.Epsilon.sum": {
"value": 0.10024306666666669,
"min": 0.10024306666666669,
"max": 0.19954793333333332,
"count": 289
},
"SoccerTwos.Policy.Beta.mean": {
"value": 2.212902666666679e-05,
"min": 2.212902666666679e-05,
"max": 0.004977441873333331,
"count": 289
},
"SoccerTwos.Policy.Beta.sum": {
"value": 2.212902666666679e-05,
"min": 2.212902666666679e-05,
"max": 0.004977441873333331,
"count": 289
}
},
"metadata": {
"timer_format_version": "0.1.0",
"start_time_seconds": "1679178285",
"python_version": "3.9.16 (main, Mar 8 2023, 14:00:05) \n[GCC 11.2.0]",
"command_line_arguments": "/home/hrcesur/miniconda3/envs/rl/bin/mlagents-learn ./config/poca/SoccerTwos.yaml --env=./training-envs-executables/SoccerTwos/SoccerTwos.x86_64 --run-id=SoccerTwos --no-graphics --force",
"mlagents_version": "0.31.0.dev0",
"mlagents_envs_version": "0.31.0.dev0",
"communication_protocol_version": "1.5.0",
"pytorch_version": "1.11.0+cu102",
"numpy_version": "1.21.2",
"end_time_seconds": "1679209314"
},
"total": 31029.345825880002,
"count": 1,
"self": 0.47647523500199895,
"children": {
"run_training.setup": {
"total": 0.017039080999893486,
"count": 1,
"self": 0.017039080999893486
},
"TrainerController.start_learning": {
"total": 31028.852311564,
"count": 1,
"self": 11.62543190283759,
"children": {
"TrainerController._reset_env": {
"total": 2.5118212519960252,
"count": 30,
"self": 2.5118212519960252
},
"TrainerController.advance": {
"total": 31014.421411322168,
"count": 415474,
"self": 11.537319528641092,
"children": {
"env_step": {
"total": 10265.694971100384,
"count": 415474,
"self": 7897.8433287695425,
"children": {
"SubprocessEnvManager._take_step": {
"total": 2360.7215402472243,
"count": 415474,
"self": 80.8951467904476,
"children": {
"TorchPolicy.evaluate": {
"total": 2279.8263934567767,
"count": 754736,
"self": 2279.8263934567767
}
}
},
"workers": {
"total": 7.1301020836169755,
"count": 415474,
"self": 0.0,
"children": {
"worker_root": {
"total": 31011.036387888747,
"count": 415474,
"is_parallel": true,
"self": 24600.084445694643,
"children": {
"run_training.setup": {
"total": 0.0,
"count": 0,
"is_parallel": true,
"self": 0.0,
"children": {
"steps_from_proto": {
"total": 0.0054780430002665526,
"count": 2,
"is_parallel": true,
"self": 0.0017358640002385073,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.0037421790000280453,
"count": 8,
"is_parallel": true,
"self": 0.0037421790000280453
}
}
},
"UnityEnvironment.step": {
"total": 0.03557804899992334,
"count": 1,
"is_parallel": true,
"self": 0.0014585970000098314,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 0.0016622109999389068,
"count": 1,
"is_parallel": true,
"self": 0.0016622109999389068
},
"communicator.exchange": {
"total": 0.028263499999866326,
"count": 1,
"is_parallel": true,
"self": 0.028263499999866326
},
"steps_from_proto": {
"total": 0.004193741000108275,
"count": 2,
"is_parallel": true,
"self": 0.0008658380002088961,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.003327902999899379,
"count": 8,
"is_parallel": true,
"self": 0.003327902999899379
}
}
}
}
}
}
},
"UnityEnvironment.step": {
"total": 6410.838686295098,
"count": 415473,
"is_parallel": true,
"self": 379.25663072938187,
"children": {
"UnityEnvironment._generate_step_input": {
"total": 374.063670495638,
"count": 415473,
"is_parallel": true,
"self": 374.063670495638
},
"communicator.exchange": {
"total": 4562.090233859916,
"count": 415473,
"is_parallel": true,
"self": 4562.090233859916
},
"steps_from_proto": {
"total": 1095.4281512101627,
"count": 830946,
"is_parallel": true,
"self": 240.53099280302786,
"children": {
"_process_rank_one_or_two_observation": {
"total": 854.8971584071348,
"count": 3323784,
"is_parallel": true,
"self": 854.8971584071348
}
}
}
}
},
"steps_from_proto": {
"total": 0.11325589900388877,
"count": 58,
"is_parallel": true,
"self": 0.024725750999550655,
"children": {
"_process_rank_one_or_two_observation": {
"total": 0.08853014800433812,
"count": 232,
"is_parallel": true,
"self": 0.08853014800433812
}
}
}
}
}
}
}
}
},
"trainer_advance": {
"total": 20737.189120693143,
"count": 415474,
"self": 76.80797019366219,
"children": {
"process_trajectory": {
"total": 3242.5880062994315,
"count": 415474,
"self": 3238.925574678427,
"children": {
"RLTrainer._checkpoint": {
"total": 3.6624316210045436,
"count": 12,
"self": 3.6624316210045436
}
}
},
"_update_policy": {
"total": 17417.793144200048,
"count": 289,
"self": 1486.0706528033752,
"children": {
"TorchPOCAOptimizer.update": {
"total": 15931.722491396673,
"count": 8685,
"self": 15931.722491396673
}
}
}
}
}
}
},
"trainer_threads": {
"total": 1.1779993656091392e-06,
"count": 1,
"self": 1.1779993656091392e-06
},
"TrainerController._save_models": {
"total": 0.2936459089978598,
"count": 1,
"self": 0.002132837998942705,
"children": {
"RLTrainer._checkpoint": {
"total": 0.2915130709989171,
"count": 1,
"self": 0.2915130709989171
}
}
}
}
}
}
}