diff --git a/environments/ai_vs_ai/ml-agents b/environments/ai_vs_ai/ml-agents --- a/environments/ai_vs_ai/ml-agents +++ b/environments/ai_vs_ai/ml-agents @@ -1 +1 @@ -Subproject commit 8bcedabd808ffb7097f88b800fc92dea82dfd610 +Subproject commit 8bcedabd808ffb7097f88b800fc92dea82dfd610-dirty diff --git a/environments/atari/model/qrdqn/QbertNoFrameskip-v4_6/0.monitor.csv b/environments/atari/model/qrdqn/QbertNoFrameskip-v4_6/0.monitor.csv index fb7057b..022e9b0 100644 --- a/environments/atari/model/qrdqn/QbertNoFrameskip-v4_6/0.monitor.csv +++ b/environments/atari/model/qrdqn/QbertNoFrameskip-v4_6/0.monitor.csv @@ -32220,3 +32220,7 @@ r,l,t 23050.0,10155,310929.782787 26000.0,11454,310943.878619 26325.0,12759,310959.764965 +15300.0,6347,310967.628622 +22950.0,11642,311015.595944 +15500.0,6612,311023.793262 +23025.0,10637,311037.115804 diff --git a/environments/atari/model/qrdqn/QbertNoFrameskip-v4_6/evaluations.npz b/environments/atari/model/qrdqn/QbertNoFrameskip-v4_6/evaluations.npz index 19b694c..3fe84a2 100644 Binary files a/environments/atari/model/qrdqn/QbertNoFrameskip-v4_6/evaluations.npz and b/environments/atari/model/qrdqn/QbertNoFrameskip-v4_6/evaluations.npz differ diff --git a/environments/sample_factory/doom_deathmatch.ipynb b/environments/sample_factory/doom_deathmatch.ipynb index 89dfc80..3d4554e 100644 --- a/environments/sample_factory/doom_deathmatch.ipynb +++ b/environments/sample_factory/doom_deathmatch.ipynb @@ -11,21 +11,112 @@ }, { "cell_type": "code", - "execution_count": 1, + "execution_count": 11, "metadata": {}, "outputs": [], "source": [ "import wandb\n", - "api = wandb.Api()\n", + "# api = wandb.Api()\n", "\n", - "run = api.run(\"matt-stammers/sample_factory/default_experiment_20230912_141858_570479\")\n", - "run.config[\"key\"] = \"default_experiment_deathmatch\"\n", - "run.update()" + "# run = api.run(\"matt-stammers/sample_factory/default_experiment_20230912_141858_570479\")\n", + "# run.config[\"key\"] = \"d753dcfca676efc5aee0dc806595b8d938c17e44\"\n", + "# run.update()" + ] + }, + { + "cell_type": "code", + "execution_count": 13, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "Failed to detect the name of this notebook, you can set it manually with the WANDB_NOTEBOOK_NAME environment variable to enable code saving.\n", + "\u001b[34m\u001b[1mwandb\u001b[0m: Currently logged in as: \u001b[33mmatt-stammers\u001b[0m. Use \u001b[1m`wandb login --relogin`\u001b[0m to force relogin\n" + ] + }, + { + "data": { + "text/html": [ + "Tracking run with wandb version 0.15.10" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "Run data is saved locally in /home/cogstack/Documents/optuna/environments/sample_factory/wandb/run-20230914_123945-f2heddj4" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "Syncing run comfy-salad-1 to Weights & Biases (docs)
" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + " View project at https://wandb.ai/matt-stammers/Doom_Duel" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + " View run at https://wandb.ai/matt-stammers/Doom_Duel/runs/f2heddj4" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "" + ], + "text/plain": [ + "" + ] + }, + "execution_count": 13, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "wandb.init(project=\"Doom_Duel\")" ] }, { "cell_type": "code", - "execution_count": 2, + "execution_count": 3, "metadata": {}, "outputs": [], "source": [ @@ -73,60 +164,59 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 12, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ - "\u001b[33m[2023-09-12 21:01:43,594][28625] Environment doom_basic already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,596][28625] Environment doom_two_colors_easy already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,599][28625] Environment doom_two_colors_hard already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,601][28625] Environment doom_dm already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,603][28625] Environment doom_dwango5 already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,604][28625] Environment doom_my_way_home_flat_actions already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,605][28625] Environment doom_defend_the_center_flat_actions already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,606][28625] Environment doom_my_way_home already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,607][28625] Environment doom_deadly_corridor already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,608][28625] Environment doom_defend_the_center already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,610][28625] Environment doom_defend_the_line already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,611][28625] Environment doom_health_gathering already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,613][28625] Environment doom_health_gathering_supreme already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,613][28625] Environment doom_battle already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,614][28625] Environment doom_battle2 already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,614][28625] Environment doom_duel_bots already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,615][28625] Environment doom_deathmatch_bots already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,616][28625] Environment doom_duel already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,616][28625] Environment doom_deathmatch_full already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,617][28625] Environment doom_benchmark already registered, overwriting...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:43,617][28625] register_encoder_factory: \u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,646][28625] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:43,650][28625] Overriding arg 'train_for_env_steps' with value 1000000 passed from command line\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:43,659][28625] Experiment dir /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment already exists!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:43,661][28625] Resuming existing experiment from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:43,661][28625] Weights and Biases integration disabled\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:43,664][28625] Environment var CUDA_VISIBLE_DEVICES is 0,1\n", + "\u001b[33m[2023-09-14 12:37:01,572][109198] Environment doom_basic already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,574][109198] Environment doom_two_colors_easy already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,576][109198] Environment doom_two_colors_hard already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,577][109198] Environment doom_dm already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,579][109198] Environment doom_dwango5 already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,580][109198] Environment doom_my_way_home_flat_actions already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,581][109198] Environment doom_defend_the_center_flat_actions already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,582][109198] Environment doom_my_way_home already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,583][109198] Environment doom_deadly_corridor already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,584][109198] Environment doom_defend_the_center already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,585][109198] Environment doom_defend_the_line already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,585][109198] Environment doom_health_gathering already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,586][109198] Environment doom_health_gathering_supreme already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,586][109198] Environment doom_battle already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,587][109198] Environment doom_battle2 already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,588][109198] Environment doom_duel_bots already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,588][109198] Environment doom_deathmatch_bots already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,589][109198] Environment doom_duel already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,589][109198] Environment doom_deathmatch_full already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,590][109198] Environment doom_benchmark already registered, overwriting...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:01,591][109198] register_encoder_factory: \u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:01,613][109198] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:01,614][109198] Experiment dir /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment already exists!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:01,615][109198] Resuming existing experiment from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:01,616][109198] Weights and Biases integration disabled\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:01,619][109198] Environment var CUDA_VISIBLE_DEVICES is 0,1\n", "\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:45,348][39338] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:45,376][39338] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:03,168][74776] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:03,196][74776] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.num_agents to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.num_agents` for environment variables or `env.get_wrapper_attr('num_agents')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.is_multiagent to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.is_multiagent` for environment variables or `env.get_wrapper_attr('is_multiagent')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", - "\u001b[36m[2023-09-12 21:01:45,378][39338] Env info: EnvInfo(obs_space=Dict('measurements': Box([ 0. 0. -1. -1. -50. 0. 0. 0. 0. 0. 0. 0. 0. 0.\n", + "\u001b[36m[2023-09-14 12:37:03,198][74776] Env info: EnvInfo(obs_space=Dict('measurements': Box([ 0. 0. -1. -1. -50. 0. 0. 0. 0. 0. 0. 0. 0. 0.\n", " 0. 0. 0. 0. 0. 0. 0. 0. 0.], [20. 50. 50. 50. 50. 1. 10. 5. 5. 5. 5. 5. 5. 5. 5. 50. 50. 50.\n", - " 50. 50. 50. 50. 50.], (23,), float32), 'obs': Box(0, 255, (3, 72, 128), uint8)), action_space=Tuple(Discrete(3), Discrete(3), Discrete(3), Discrete(2), Discrete(2), Box(-1.0, 1.0, (1,), float32)), num_agents=8, gpu_actions=False, gpu_observations=True, action_splits=[1, 1, 1, 1, 1, 1], all_discrete=False, frameskip=4, reward_shaping_scheme={'delta': {'FRAGCOUNT': (1, -0.001), 'DEATHCOUNT': (-1, 1), 'HITCOUNT': (0, 0), 'DAMAGECOUNT': (0.01, -0.01), 'HEALTH': (0.01, -0.01), 'ARMOR': (0.005, -0.001), 'WEAPON0': (0.02, -0.01), 'AMMO0': (0.0002, -0.0001), 'WEAPON1': (0.02, -0.01), 'AMMO1': (0.0002, -0.0001), 'WEAPON2': (0.02, -0.01), 'AMMO2': (0.0002, -0.0001), 'WEAPON3': (0.1, -0.05), 'AMMO3': (0.001, -0.0005), 'WEAPON4': (0.1, -0.05), 'AMMO4': (0.001, -0.0005), 'WEAPON5': (0.1, -0.05), 'AMMO5': (0.001, -0.0005), 'WEAPON6': (0.2, -0.1), 'AMMO6': (0.002, -0.001), 'WEAPON7': (0.2, -0.1), 'AMMO7': (0.002, -0.001)}, 'selected_weapon': {'SELECTED0': 0.0002, 'SELECTED1': 0.0002, 'SELECTED2': 0.0002, 'SELECTED3': 0.001, 'SELECTED4': 0.001, 'SELECTED5': 0.001, 'SELECTED6': 0.002, 'SELECTED7': 0.002}}, env_info_protocol_version=1)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:45,745][28625] Starting experiment with the following configuration:\n", + " 50. 50. 50. 50. 50.], (23,), float32), 'obs': Box(0, 255, (3, 72, 128), uint8)), action_space=Tuple(Discrete(3), Discrete(3), Discrete(8), Discrete(2), Discrete(2), Discrete(2), Discrete(21)), num_agents=2, gpu_actions=False, gpu_observations=True, action_splits=[1, 1, 1, 1, 1, 1, 1], all_discrete=True, frameskip=4, reward_shaping_scheme={'delta': {'FRAGCOUNT': (1, -0.001), 'DEATHCOUNT': (-1, 1), 'HITCOUNT': (0, 0), 'DAMAGECOUNT': (0.01, -0.01), 'HEALTH': (0.01, -0.01), 'ARMOR': (0.005, -0.001), 'WEAPON0': (0.02, -0.01), 'AMMO0': (0.0002, -0.0001), 'WEAPON1': (0.02, -0.01), 'AMMO1': (0.0002, -0.0001), 'WEAPON2': (0.02, -0.01), 'AMMO2': (0.0002, -0.0001), 'WEAPON3': (0.1, -0.05), 'AMMO3': (0.001, -0.0005), 'WEAPON4': (0.1, -0.05), 'AMMO4': (0.001, -0.0005), 'WEAPON5': (0.1, -0.05), 'AMMO5': (0.001, -0.0005), 'WEAPON6': (0.2, -0.1), 'AMMO6': (0.002, -0.001), 'WEAPON7': (0.2, -0.1), 'AMMO7': (0.002, -0.001)}, 'selected_weapon': {'SELECTED0': 0.0002, 'SELECTED1': 0.0002, 'SELECTED2': 0.0002, 'SELECTED3': 0.001, 'SELECTED4': 0.001, 'SELECTED5': 0.001, 'SELECTED6': 0.002, 'SELECTED7': 0.002}}, env_info_protocol_version=1)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:03,541][109198] Starting experiment with the following configuration:\n", "help=False\n", "algo=APPO\n", - "env=doom_dwango5\n", + "env=doom_duel\n", "experiment=default_experiment\n", "train_dir=/home/cogstack/Documents/optuna/environments/sample_factory/train_dir\n", "restart_behavior=resume\n", "device=gpu\n", "seed=None\n", - "num_policies=1\n", + "num_policies=2\n", "async_rl=True\n", "serial_mode=False\n", "batched_sampling=False\n", @@ -184,7 +274,7 @@ "summaries_use_frameskip=True\n", "heartbeat_interval=20\n", "heartbeat_reporting_interval=600\n", - "train_for_env_steps=1000000\n", + "train_for_env_steps=10000000\n", "train_for_seconds=10000000000\n", "save_every_sec=120\n", "keep_checkpoints=2\n", @@ -248,44 +338,117 @@ "cli_args={'env': 'doom_dm', 'num_workers': 8, 'num_envs_per_worker': 4, 'train_for_env_steps': 20000000}\n", "git_hash=20b6d44612dad7d171f23e13b1f3b4c5e5631cf9\n", "git_repo_name=https://github.com/MattStammers/optuna.git\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:45,747][28625] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,757][28625] Rollout worker 0 uses device cpu\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,758][28625] Rollout worker 1 uses device cpu\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,760][28625] Rollout worker 2 uses device cpu\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,761][28625] Rollout worker 3 uses device cpu\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,763][28625] Rollout worker 4 uses device cpu\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,765][28625] Rollout worker 5 uses device cpu\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,767][28625] Rollout worker 6 uses device cpu\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,768][28625] Rollout worker 7 uses device cpu\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,937][28625] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:46,939][28625] InferenceWorker_p0-w0: min num requests: 2\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,973][28625] Starting all processes...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,974][28625] Starting process learner_proc0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,713][28625] Starting all processes...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:48,713][39537] LearnerWorker_p0\tpid 39537\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,714][39537] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:48,714][39537] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,719][28625] Starting process inference_proc0-0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,719][28625] Starting process rollout_proc0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,720][28625] Starting process rollout_proc1\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,720][28625] Starting process rollout_proc2\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,725][28625] Starting process rollout_proc3\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,725][28625] Starting process rollout_proc4\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,725][28625] Starting process rollout_proc5\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,759][39537] Num visible devices: 1\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,726][28625] Starting process rollout_proc6\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,726][28625] Starting process rollout_proc7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:48,796][39537] Starting seed is not provided\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,797][39537] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,797][39537] Initializing actor-critic model on device cuda:0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,797][39537] RunningMeanStd input shape: (23,)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,798][39537] RunningMeanStd input shape: (3, 72, 128)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,798][39537] RunningMeanStd input shape: (1,)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,810][39537] ConvEncoder: input_channels=3\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,954][39537] Conv encoder output size: 512\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,956][39537] Policy head output size: 640\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,984][39537] Created Actor Critic model with architecture:\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,986][39537] ActorCriticSharedWeights(\n", + "\u001b[36m[2023-09-14 12:37:03,543][109198] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:03,663][109198] Rollout worker 0 uses device cpu\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:03,664][109198] Rollout worker 1 uses device cpu\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:03,665][109198] Rollout worker 2 uses device cpu\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:03,667][109198] Rollout worker 3 uses device cpu\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:03,669][109198] Rollout worker 4 uses device cpu\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:03,671][109198] Rollout worker 5 uses device cpu\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:03,672][109198] Rollout worker 6 uses device cpu\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:03,673][109198] Rollout worker 7 uses device cpu\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:03,747][109198] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:03,748][109198] InferenceWorker_p0-w0: min num requests: 1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:03,753][109198] Using GPUs [1] for process 1 (actually maps to GPUs [1])\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:03,754][109198] InferenceWorker_p1-w0: min num requests: 1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:03,790][109198] Starting all processes...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:03,792][109198] Starting process learner_proc0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:05,393][109198] Starting process learner_proc1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:05,395][74942] LearnerWorker_p0\tpid 74942\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:05,395][74942] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:05,396][74942] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:05,434][74942] Num visible devices: 1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:05,475][74942] Starting seed is not provided\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:05,475][74942] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:05,476][74942] Initializing actor-critic model on device cuda:0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:05,476][74942] RunningMeanStd input shape: (23,)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:05,476][74942] RunningMeanStd input shape: (3, 72, 128)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:05,477][74942] RunningMeanStd input shape: (1,)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:05,488][74942] ConvEncoder: input_channels=3\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:05,599][74942] Conv encoder output size: 512\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:05,600][74942] Policy head output size: 640\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:05,618][74942] Created Actor Critic model with architecture:\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:05,618][74942] ActorCriticSharedWeights(\n", + " (obs_normalizer): ObservationNormalizer(\n", + " (running_mean_std): RunningMeanStdDictInPlace(\n", + " (running_mean_std): ModuleDict(\n", + " (measurements): RunningMeanStdInPlace()\n", + " (obs): RunningMeanStdInPlace()\n", + " )\n", + " )\n", + " )\n", + " (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace)\n", + " (encoder): VizdoomEncoder(\n", + " (basic_encoder): ConvEncoder(\n", + " (enc): RecursiveScriptModule(\n", + " original_name=ConvEncoderImpl\n", + " (conv_head): RecursiveScriptModule(\n", + " original_name=Sequential\n", + " (0): RecursiveScriptModule(original_name=Conv2d)\n", + " (1): RecursiveScriptModule(original_name=ELU)\n", + " (2): RecursiveScriptModule(original_name=Conv2d)\n", + " (3): RecursiveScriptModule(original_name=ELU)\n", + " (4): RecursiveScriptModule(original_name=Conv2d)\n", + " (5): RecursiveScriptModule(original_name=ELU)\n", + " )\n", + " (mlp_layers): RecursiveScriptModule(\n", + " original_name=Sequential\n", + " (0): RecursiveScriptModule(original_name=Linear)\n", + " (1): RecursiveScriptModule(original_name=ELU)\n", + " )\n", + " )\n", + " )\n", + " (measurements_head): Sequential(\n", + " (0): Linear(in_features=23, out_features=128, bias=True)\n", + " (1): ELU(alpha=1.0)\n", + " (2): Linear(in_features=128, out_features=128, bias=True)\n", + " (3): ELU(alpha=1.0)\n", + " )\n", + " )\n", + " (core): ModelCoreRNN(\n", + " (core): GRU(640, 512)\n", + " )\n", + " (decoder): MlpDecoder(\n", + " (mlp): Identity()\n", + " )\n", + " (critic_linear): Linear(in_features=512, out_features=1, bias=True)\n", + " (action_parameterization): ActionParameterizationDefault(\n", + " (distribution_linear): Linear(in_features=512, out_features=41, bias=True)\n", + " )\n", + ")\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:06,503][74942] Using optimizer \u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:06,504][74942] Loading state from checkpoint /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001187_4861952.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:06,529][74942] Loading model from checkpoint\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:06,534][74942] Loaded experiment state at self.train_step=1187, self.env_steps=4861952\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:06,535][74942] Initialized policy 0 weights for model version 1187\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:06,536][74942] LearnerWorker_p0 finished initialization!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:06,537][74942] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,035][109198] Starting all processes...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:07,036][75052] LearnerWorker_p1\tpid 75052\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,036][75052] Using GPUs [1] for process 1 (actually maps to GPUs [1])\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:07,037][75052] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for learning process 1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,041][109198] Starting process inference_proc0-0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,042][109198] Starting process inference_proc1-0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,043][109198] Starting process rollout_proc0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,043][109198] Starting process rollout_proc1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,044][109198] Starting process rollout_proc2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,045][109198] Starting process rollout_proc3\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,045][109198] Starting process rollout_proc4\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,073][75052] Num visible devices: 1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,046][109198] Starting process rollout_proc5\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,047][109198] Starting process rollout_proc6\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,048][109198] Starting process rollout_proc7\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:07,119][75052] Starting seed is not provided\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,119][75052] Using GPUs [0] for process 1 (actually maps to GPUs [1])\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,120][75052] Initializing actor-critic model on device cuda:0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,120][75052] RunningMeanStd input shape: (23,)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,121][75052] RunningMeanStd input shape: (3, 72, 128)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,121][75052] RunningMeanStd input shape: (1,)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,140][75052] ConvEncoder: input_channels=3\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,369][75052] Conv encoder output size: 512\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,370][75052] Policy head output size: 640\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,400][75052] Created Actor Critic model with architecture:\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:07,400][75052] ActorCriticSharedWeights(\n", " (obs_normalizer): ObservationNormalizer(\n", " (running_mean_std): RunningMeanStdDictInPlace(\n", " (running_mean_std): ModuleDict(\n", @@ -330,6694 +493,1819 @@ " )\n", " (critic_linear): Linear(in_features=512, out_features=1, bias=True)\n", " (action_parameterization): ActionParameterizationDefault(\n", - " (distribution_linear): Linear(in_features=512, out_features=15, bias=True)\n", + " (distribution_linear): Linear(in_features=512, out_features=41, bias=True)\n", " )\n", ")\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,408][39537] Using optimizer \u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:50,409][39537] No checkpoints found\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,409][39537] Did not load from checkpoint, starting from scratch!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,409][39537] Initialized policy 0 weights for model version 0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,412][39537] LearnerWorker_p0 finished initialization!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,412][39537] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,709][39685] Rollout worker 0 starting...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:50,709][39685] ROLLOUT worker 0\tpid 39685\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,710][39685] Worker 0 uses CPU cores [0, 1, 2, 3]\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,780][39698] Rollout worker 3 starting...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:50,780][39698] ROLLOUT worker 3\tpid 39698\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,780][39698] Worker 3 uses CPU cores [12, 13, 14, 15]\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,818][39731] Rollout worker 4 starting...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:50,818][39731] ROLLOUT worker 4\tpid 39731\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,819][39731] Worker 4 uses CPU cores [16, 17, 18, 19]\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,855][39734] Rollout worker 7 starting...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:50,855][39734] ROLLOUT worker 7\tpid 39734\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,857][39734] Worker 7 uses CPU cores [28, 29, 30, 31]\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,880][39699] Rollout worker 5 starting...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:50,880][39699] ROLLOUT worker 5\tpid 39699\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,881][39699] Worker 5 uses CPU cores [20, 21, 22, 23]\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:50,915][39686] InferenceWorker_p0-w0\tpid 39686\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,915][39686] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:50,915][39686] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,927][39696] Rollout worker 2 starting...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:50,927][39696] ROLLOUT worker 2\tpid 39696\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,931][39696] Worker 2 uses CPU cores [8, 9, 10, 11]\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,954][39686] Num visible devices: 1\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,991][39733] Rollout worker 6 starting...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:50,991][39733] ROLLOUT worker 6\tpid 39733\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,992][39733] Worker 6 uses CPU cores [24, 25, 26, 27]\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:51,090][39697] Rollout worker 1 starting...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:51,090][39697] ROLLOUT worker 1\tpid 39697\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:51,090][39697] Worker 1 uses CPU cores [4, 5, 6, 7]\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:51,618][39686] RunningMeanStd input shape: (23,)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:51,618][39686] RunningMeanStd input shape: (3, 72, 128)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:51,618][39686] RunningMeanStd input shape: (1,)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:51,630][39686] ConvEncoder: input_channels=3\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:51,739][39686] Conv encoder output size: 512\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:51,740][39686] Policy head output size: 640\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,083][28625] Inference worker 0-0 is ready!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,085][28625] All inference workers are ready! Signal rollout workers to start!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,088][39685] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,090][39698] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,091][39734] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,092][39696] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,092][39699] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,092][39697] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,093][39731] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,094][39733] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,118][39685] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,121][39685] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,124][39734] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,125][39697] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,125][39699] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,126][39696] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,127][39731] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,128][39734] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,129][39697] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,129][39699] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,129][39696] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,130][39731] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,134][39698] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,139][39733] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,139][39698] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,143][39733] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,151][39685] Port 40300 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,151][39685] Using port 40300\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,152][39685] Initializing env for player 0, init_info: {'port': 40300}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,160][39697] Port 40400 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,160][39697] Using port 40400\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,161][39696] Port 40500 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,161][39699] Port 40800 is available\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,161][39697] Initializing env for player 0, init_info: {'port': 40400}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,161][39696] Using port 40500\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,161][39699] Using port 40800\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,161][39734] Port 41000 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,161][39734] Using port 41000\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,162][39696] Initializing env for player 0, init_info: {'port': 40500}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,162][39699] Initializing env for player 0, init_info: {'port': 40800}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,163][39734] Initializing env for player 0, init_info: {'port': 41000}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,176][39733] Port 40900 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,176][39733] Using port 40900\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,177][39733] Initializing env for player 0, init_info: {'port': 40900}...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:08,655][75052] Using optimizer \u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:08,656][75052] Loading state from checkpoint /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000481_1970176.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:08,685][75052] Loading model from checkpoint\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:08,690][75052] Loaded experiment state at self.train_step=481, self.env_steps=1970176\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:08,691][75052] Initialized policy 1 weights for model version 481\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:08,693][75052] LearnerWorker_p1 finished initialization!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:08,693][75052] Using GPUs [0] for process 1 (actually maps to GPUs [1])\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:08,972][75218] Rollout worker 3 starting...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:08,972][75218] ROLLOUT worker 3\tpid 75218\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:08,973][75218] Worker 3 uses CPU cores [12, 13, 14, 15]\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:09,066][75219] Rollout worker 4 starting...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:09,067][75219] ROLLOUT worker 4\tpid 75219\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:09,067][75219] Worker 4 uses CPU cores [16, 17, 18, 19]\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:09,074][75215] Rollout worker 1 starting...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:09,074][75215] ROLLOUT worker 1\tpid 75215\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:09,075][75215] Worker 1 uses CPU cores [4, 5, 6, 7]\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:09,076][75217] Rollout worker 2 starting...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:09,077][75217] ROLLOUT worker 2\tpid 75217\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:09,077][75217] Worker 2 uses CPU cores [8, 9, 10, 11]\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:09,321][75216] Rollout worker 0 starting...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:09,321][75216] ROLLOUT worker 0\tpid 75216\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:09,323][75216] Worker 0 uses CPU cores [0, 1, 2, 3]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:09,473][75209] InferenceWorker_p1-w0\tpid 75209\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:09,474][75209] Using GPUs [1] for process 1 (actually maps to GPUs [1])\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:09,474][75209] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for inference process 1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:09,491][75209] Num visible devices: 1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:09,615][75254] Rollout worker 7 starting...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:09,615][75254] ROLLOUT worker 7\tpid 75254\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:09,616][75254] Worker 7 uses CPU cores [28, 29, 30, 31]\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:09,659][75252] Rollout worker 5 starting...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:09,659][75252] ROLLOUT worker 5\tpid 75252\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:09,660][75252] Worker 5 uses CPU cores [20, 21, 22, 23]\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:09,684][75253] Rollout worker 6 starting...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:09,684][75253] ROLLOUT worker 6\tpid 75253\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:09,685][75253] Worker 6 uses CPU cores [24, 25, 26, 27]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:09,698][75214] InferenceWorker_p0-w0\tpid 75214\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:09,699][75214] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:09,699][75214] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:09,718][75214] Num visible devices: 1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,169][75209] RunningMeanStd input shape: (23,)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,170][75209] RunningMeanStd input shape: (3, 72, 128)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,170][75209] RunningMeanStd input shape: (1,)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,182][75209] ConvEncoder: input_channels=3\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,286][75209] Conv encoder output size: 512\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,287][75209] Policy head output size: 640\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,315][75214] RunningMeanStd input shape: (23,)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,315][75214] RunningMeanStd input shape: (3, 72, 128)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,316][75214] RunningMeanStd input shape: (1,)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,327][75214] ConvEncoder: input_channels=3\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,435][75214] Conv encoder output size: 512\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,436][75214] Policy head output size: 640\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,565][109198] Inference worker 1-0 is ready!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,723][109198] Inference worker 0-0 is ready!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,724][109198] All inference workers are ready! Signal rollout workers to start!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,729][75218] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,729][75219] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,729][75215] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,730][75252] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,731][75216] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,732][75217] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,732][75254] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,733][75253] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,764][75218] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,765][75216] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,768][75216] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,769][75218] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,769][75252] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,772][75217] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,772][75252] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,774][75254] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,775][75217] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,775][75253] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,776][75215] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,776][75219] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,778][75254] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,779][75253] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,780][75215] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,780][75219] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,807][75217] Port 40500 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,807][75252] Port 40800 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,807][75216] Port 40300 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,807][75217] Using port 40500\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,807][75252] Using port 40800\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,807][75216] Using port 40300\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,808][75217] Initializing env for player 0, init_info: {'port': 40500}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,808][75252] Initializing env for player 0, init_info: {'port': 40800}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,808][75216] Initializing env for player 0, init_info: {'port': 40300}...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:10,810][75254] UDP port 41000 cannot be used [Errno 98] Address already in use\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,810][75254] Port 42000 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,811][75254] Using port 42000\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,813][75254] Initializing env for player 0, init_info: {'port': 42000}...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,814][75218] Port 40600 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,814][75218] Using port 40600\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,815][75218] Initializing env for player 0, init_info: {'port': 40600}...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,825][75253] Port 40900 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,825][75253] Using port 40900\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,826][75215] Port 40400 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,826][75215] Using port 40400\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,826][75253] Initializing env for player 0, init_info: {'port': 40900}...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,826][75219] Port 40700 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:10,827][75219] Using port 40700\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,827][75215] Initializing env for player 0, init_info: {'port': 40400}...\u001b[0m\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,185][39685] Using port 40300 on host...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,186][39698] Port 40600 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,186][39698] Using port 40600\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,187][39698] Initializing env for player 0, init_info: {'port': 40600}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,837][75217] Using port 40500 on host...\u001b[0m\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,193][39734] Using port 41000 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,841][75254] Using port 42000 on host...\u001b[0m\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,195][39696] Using port 40500 on host...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,197][39731] Port 40700 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,197][39731] Using port 40700\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,202][39685] Initializing env for player 1, init_info: {'port': 40300}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,843][75216] Using port 40300 on host...\u001b[0m\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,207][39733] Using port 40900 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,849][75218] Using port 40600 on host...\u001b[0m\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,209][39697] Using port 40400 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,854][75252] Using port 40800 on host...\u001b[0m\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,210][39699] Using port 40800 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,212][39696] Initializing env for player 1, init_info: {'port': 40500}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,214][39734] Initializing env for player 1, init_info: {'port': 41000}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,217][39699] Initializing env for player 1, init_info: {'port': 40800}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,219][39697] Initializing env for player 1, init_info: {'port': 40400}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,855][75253] Using port 40900 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,858][75217] Initializing env for player 1, init_info: {'port': 40500}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,858][75216] Initializing env for player 1, init_info: {'port': 40300}...\u001b[0m\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,229][39733] Initializing env for player 1, init_info: {'port': 40900}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,229][39698] Using port 40600 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,238][39698] Initializing env for player 1, init_info: {'port': 40600}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,253][39685] Initializing env for player 2, init_info: {'port': 40300}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,263][39696] Initializing env for player 2, init_info: {'port': 40500}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,264][39734] Initializing env for player 2, init_info: {'port': 41000}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,267][39699] Initializing env for player 2, init_info: {'port': 40800}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,274][39697] Initializing env for player 2, init_info: {'port': 40400}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,279][39733] Initializing env for player 2, init_info: {'port': 40900}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,291][39698] Initializing env for player 2, init_info: {'port': 40600}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,303][39685] Initializing env for player 3, init_info: {'port': 40300}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,315][39734] Initializing env for player 3, init_info: {'port': 41000}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,321][39697] Initializing env for player 3, init_info: {'port': 40400}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,322][39696] Initializing env for player 3, init_info: {'port': 40500}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,324][39699] Initializing env for player 3, init_info: {'port': 40800}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,335][39733] Initializing env for player 3, init_info: {'port': 40900}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,341][39698] Initializing env for player 3, init_info: {'port': 40600}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,353][39685] Initializing env for player 4, init_info: {'port': 40300}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,370][39734] Initializing env for player 4, init_info: {'port': 41000}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,371][39696] Initializing env for player 4, init_info: {'port': 40500}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,371][39697] Initializing env for player 4, init_info: {'port': 40400}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,383][39733] Initializing env for player 4, init_info: {'port': 40900}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,385][39699] Initializing env for player 4, init_info: {'port': 40800}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,392][39698] Initializing env for player 4, init_info: {'port': 40600}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,404][39685] Initializing env for player 5, init_info: {'port': 40300}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,418][39696] Initializing env for player 5, init_info: {'port': 40500}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,426][39734] Initializing env for player 5, init_info: {'port': 41000}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,427][39697] Initializing env for player 5, init_info: {'port': 40400}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,431][39699] Initializing env for player 5, init_info: {'port': 40800}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,435][39733] Initializing env for player 5, init_info: {'port': 40900}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,443][39698] Initializing env for player 5, init_info: {'port': 40600}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,455][39685] Initializing env for player 6, init_info: {'port': 40300}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,475][39696] Initializing env for player 6, init_info: {'port': 40500}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,477][39699] Initializing env for player 6, init_info: {'port': 40800}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,479][39697] Initializing env for player 6, init_info: {'port': 40400}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,483][39734] Initializing env for player 6, init_info: {'port': 41000}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,485][39733] Initializing env for player 6, init_info: {'port': 40900}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,499][39698] Initializing env for player 6, init_info: {'port': 40600}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,515][39685] Initializing env for player 7, init_info: {'port': 40300}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,527][39696] Initializing env for player 7, init_info: {'port': 40500}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,535][39697] Initializing env for player 7, init_info: {'port': 40400}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,535][39734] Initializing env for player 7, init_info: {'port': 41000}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,539][39699] Initializing env for player 7, init_info: {'port': 40800}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,539][39733] Initializing env for player 7, init_info: {'port': 40900}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,551][39698] Initializing env for player 7, init_info: {'port': 40600}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,860][75215] Using port 40400 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,860][75252] Initializing env for player 1, init_info: {'port': 40800}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,863][75254] Initializing env for player 1, init_info: {'port': 42000}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,865][75218] Initializing env for player 1, init_info: {'port': 40600}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,877][75253] Initializing env for player 1, init_info: {'port': 40900}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:10,878][75215] Initializing env for player 1, init_info: {'port': 40400}...\u001b[0m\n", "Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", "Contacting host: /Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. ss 'Q' to abort network game synchronization.\n", - "Waiting for players: .. [ 2/ 8]Press 'Q' to abort network game synchronization.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Contacting host: \\Press 'Q' to abort network game synchronization.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", "Contacting host: /Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", "Contacting host: /Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", "Contacting host: /Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Waiting for other players: .. [ 2/ 8]Press 'Q' to abort network game synchronization.\n", + "Contacting host: /Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Total players: 8 \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Waiting for other players: .... [ 4/ 8]\n", "Got connect from node 1. \n", - "Waiting for players: .. [ 2/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", + "Total players: 2 \n", + "\n", + "Waiting for other players: .. [ 2/ 2]\n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", + "Total players: 2 \n", "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Waiting for other players: ..... [ 5/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 2. \n", - "Waiting for players: ... [ 3/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", + "Waiting for other players: .. [ 2/ 2]\n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", "Sending all here. \n", "\n", - "Waiting for other players: ........ [ 8/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 2. 8]\n", - "Waiting for players: ... [ 3/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", "Got connect from node 1. \n", - "Total players: 8 \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", "Got connect from node 1. \n", - "Waiting for other players: ... [ 3/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", + "Total players: 2 \n", "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 \n", + "Waiting for other players: .. [ 2/ 2]\n", + "Total players: 2 \n", "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: \\Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ........ [ 8/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 8]\n", + "Waiting for other players: .. [ 2/ 2]\n", + "Total players: 2 \n", "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Got connect from node 3. \n", - "Waiting for players: .... [ 4/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 2 \n", + "Waiting for other players: .. [ 2/ 2]\n", + "Total players: 2 \n", + "\n", + "Waiting for other players: .. [ 2/ 2]\n", + "Total players: 2 \n", + "\n", + "Waiting for other players: .. [ 2/ 2]\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Console player number: 3 8]\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Total players: 8 \n", "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Total players: 8 8]/ 8] 8]\n", + "Go \n", + "Total players: 2 \n", "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Total players: 8 \n", + "Go \n", + "Total players: 2 \n", "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Got connect from node 2. \n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 5 8]\n", + "Exchanging game information.\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Console player number: 6 8]\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Console player number: 4 \n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Console player number: 1 8]\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Console player number: 7 \n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Waiting for players: ....... [ 7/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "\n", - "Go \n", - "Total players: 8 \n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", - "Total players: 8 \n", + "Total players: 2 \n", "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 8]\n", + "Go \n", + "Total players: 2 \n", "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", + "Exchanging game information.\n", + "Exchanging game information.\u001b[36m[2023-09-14 12:37:11,619][109198] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 6832128. Throughput: 0: nan, 1: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", - "Contacting host: -\n", - "Got connect from node 6. \n", - "Waiting for players: ....... [ 7/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", + "Total players: 2 \n", "\n", - "Total players: 8 \n", + "Go \n", + "Total players: 2 \n", "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Got connect from node 4. 8]\n", - "Got connect from node 5. [ 5/ 8]\n", - "Got connect from node 6. 8]\n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", + "Go \n", + "Total players: 2 \n", "\n", - "Total players: 8 8]\n", + "Exchanging game information.\n", + "Exchanging game information.\n", + "Exchanging game information.\n", + "Go \n", + "Total players: 2 \n", "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 \n", + "Go \n", + "Total players: 2 \n", "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Total players: 8 8]\n", + "Exchanging game information.\n", + "Console player number: 1 \n", + "Received All Here, sending ACK. \n", + "Received \"Go.\" \n", "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 8]\n", + "Total players: 2 \n", "\n", - "Waiting for other players: .... [ 4/ 8]\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", - "Got connect from node 6. 8]... [ 6/ 8]\n", - "Received All Here, sending ACK. 8]\n", + "Total players: 2 \n", + "Console player number: 1 \n", + "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", - "Total players: 8 \n", + "Total players: 2 \n", "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", + "Total players: 2 \n", "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "\n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Received All Here, sending ACK. 8]\n", + "Console player number: 1 \n", + "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Got connect from node 7. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", + "Total players: 2 \n", "\n", - "Total players: 8 \n", + "Exchanging game information.\n", + "Found AI0_host (node 1, player 1) \n", + "Found AI1 (node 1, player 2) \n", + "Found AI0_host (node 1, player 1) \n", + "Found AI1 (node 1, player 2) \n", + "Found AI0_host (node 1, player 1) \n", + "Found AI0_host (node 1, player 1) \n", + "Found AI0_host (node 1, player 1) \n", + "Found AI0_host (node 1, player 1) \n", + "Found AI0_host (node 1, player 1) \n", + "Found AI1 (node 1, player 2) \n", + "Found AI1 (node 0, player 2) \n", "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 \n", + "Found AI1 (node 1, player 2) \n", + "Found AI1 (node 1, player 2) \n", + "Found AI1 (node 0, player 2) \n", "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Total players: 8 8]\n", + "Found AI1 (node 1, player 2) \n", + "Found AI1 (node 1, player 2) \n", + "Found AI1 (node 0, player 2) \n", + "Found AI1 (node 0, player 2) \n", + "Found AI1 (node 0, player 2) \n", + "Found AI1 (node 0, player 2) \n", + "Found AI1 (node 0, player 2) \n", "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Total players: 8 8]\n", "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", "\n", - "Found AI3 (node 2, player 3) 8]\n", - "Found AI2 (node 3, player 4) \n", - "Got connect from node 5. 8]\n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", "\n", - "Total players: 8 8]\n", "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Got connect from node 7. 8]\n", - "Waiting for players: ........ [ 8/ 8]\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:11,938][75216] Initialized w:0 v:0 player:1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:11,941][75216] Initialized w:0 v:0 player:0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:11,941][75216] 2 agent workers initialized for env 0!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:11,948][75253] Initialized w:6 v:0 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:11,949][75253] Initialized w:6 v:0 player:1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:11,950][75253] 2 agent workers initialized for env 6!\u001b[0m\n", + "\n", + "\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:11,956][75216] Decorrelating experience for 0 frames...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:11,957][75216] Port 40301 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:11,957][75216] Using port 40301\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:11,964][75253] Decorrelating experience for 0 frames...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:11,965][75253] Port 40901 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:11,965][75253] Using port 40901\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:11,965][75253] Initializing env for player 0, init_info: {'port': 40901}...\u001b[0m\n", + "\n", + "\n", + "\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:11,985][75252] Initialized w:5 v:0 player:1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:11,986][75252] Initialized w:5 v:0 player:0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:11,987][75252] 2 agent workers initialized for env 5!\u001b[0m\n", + "\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:11,992][75217] Initialized w:2 v:0 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:11,993][75217] Initialized w:2 v:0 player:1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:11,994][75253] Using port 40901 on host...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:11,995][75217] 2 agent workers initialized for env 2!\u001b[0m\n", + "\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:11,997][75252] Decorrelating experience for 0 frames...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:11,998][75252] Port 40801 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:11,998][75252] Using port 40801\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:11,999][75252] Initializing env for player 0, init_info: {'port': 40801}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,001][75218] Initialized w:3 v:0 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,001][75218] Initialized w:3 v:0 player:1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:12,003][75218] 2 agent workers initialized for env 3!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,003][75215] Initialized w:1 v:0 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,003][75215] Initialized w:1 v:0 player:1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:12,005][75215] 2 agent workers initialized for env 1!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,006][75217] Decorrelating experience for 0 frames...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:12,006][75217] Port 40501 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:12,007][75217] Using port 40501\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,008][75216] Initializing env for player 0, init_info: {'port': 40301}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,009][75254] Initialized w:7 v:0 player:1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,010][75254] Initialized w:7 v:0 player:0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:12,012][75254] 2 agent workers initialized for env 7!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,016][75215] Decorrelating experience for 0 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,016][75253] Initializing env for player 1, init_info: {'port': 40901}...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:12,016][75215] Port 40401 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:12,017][75215] Using port 40401\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,017][75218] Decorrelating experience for 0 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,017][75215] Initializing env for player 0, init_info: {'port': 40401}...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:12,017][75218] Port 40601 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:12,017][75218] Using port 40601\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,018][75218] Initializing env for player 0, init_info: {'port': 40601}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,029][75252] Using port 40801 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,029][75254] Decorrelating experience for 0 frames...\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:12,030][75254] UDP port 41001 cannot be used [Errno 98] Address already in use\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:12,030][75254] Port 42001 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:12,031][75254] Using port 42001\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,031][75254] Initializing env for player 0, init_info: {'port': 42001}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,038][75219] Initializing env for player 0, init_info: {'port': 40700}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,038][75216] Using port 40301 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,049][75218] Using port 40601 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,049][75252] Initializing env for player 1, init_info: {'port': 40801}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,052][75215] Using port 40401 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,058][75216] Initializing env for player 1, init_info: {'port': 40301}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,062][75254] Using port 42001 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,068][75215] Initializing env for player 1, init_info: {'port': 40401}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,068][75218] Initializing env for player 1, init_info: {'port': 40601}...\u001b[0m\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,082][75219] Using port 40700 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,082][75254] Initializing env for player 1, init_info: {'port': 42001}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:12,089][75219] Initializing env for player 1, init_info: {'port': 40700}...\u001b[0m\n", + "Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Contacting host: /Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", "Sending all here. \n", "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI3 (node 3, player 3) \n", - "Console player number: 4 8]\n", - "Received All Here, sending ACK. \n", - "Found AI2 (node 4, player 4) \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) 8]\n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI3 (node 2, player 3) 8]\n", - "Found AI2 (node 3, player 4) \n", - "Console player number: 2 8]\n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Console player number: 3 8]\n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 8]\n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI3 (node 0, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 0, player 4) \n", - "Found AI5 (node 5, player 6) 8]\n", - "Found AI6 (node 6, player 7) \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Found AI4 (node 4, player 5) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI7 (node 7, player 8) \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "\n", - "Go \n", - "Total players: 8 \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "\n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Console player number: 7 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 5, player 5) \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI7 (node 7, player 8) \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "\n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 0, player 2) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI4 (node 4, player 5) \n", - "\n", - "Found AI5 (node 5, player 6) \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Found AI6 (node 6, player 7) \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Found AI7 (node 7, player 8) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 5, player 5) \n", - "\n", - "Go \n", - "Found AI5 (node 6, player 6) \n", - "\n", - "Go \n", - "Total players: 8 \n", - "Found AI6 (node 7, player 7) \n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Found AI7 (node 0, player 8) \n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "\n", - "Exchanging game information.\n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Go \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI4 (node 4, player 5) \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Received All Here, sending ACK. \n", - "Found AI7 (node 7, player 8) \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Go \n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "\n", - "Go \n", - "Total players: 8 \n", - "\u001b[36m[2023-09-12 21:01:53,664][28625] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 0. Throughput: 0: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI5 (node 2, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI7 (node 6, player 7) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 1, player 2) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,759][39685] Initialized w:0 v:0 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,761][39685] Initialized w:0 v:0 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,762][39685] Initialized w:0 v:0 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,762][39685] Initialized w:0 v:0 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,762][39685] Initialized w:0 v:0 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,762][39685] Initialized w:0 v:0 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,763][39685] Initialized w:0 v:0 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,763][39685] Initialized w:0 v:0 player:0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:53,765][39685] 8 agent workers initialized for env 0!\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI3 (node 0, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 0, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI2 (node 0, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI7 (node 4, player 5) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI2 (node 5, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI5 (node 2, player 3) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI7 (node 7, player 7) \n", - "Found AI6 (node 0, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI3 (node 6, player 6) \n", - "Found AI7 (node 0, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI7 (node 0, player 5) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI2 (node 5, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI3 (node 6, player 6) \n", - "Found AI7 (node 7, player 7) \n", - "Found AI6 (node 0, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,832][39685] Decorrelating experience for 0 frames...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:53,833][39685] Port 40301 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:53,833][39685] Using port 40301\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,834][39685] Initializing env for player 0, init_info: {'port': 40301}...\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI5 (node 2, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI7 (node 5, player 5) \n", - "Found AI2 (node 0, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI5 (node 2, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 0, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 4, player 5) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI2 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 5, player 5) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI2 (node 6, player 6) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI3 (node 7, player 7) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI6 (node 0, player 8) \n", - "Found AI5 (node 0, player 6) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,863][39685] Using port 40301 on host...\u001b[0m\n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "\n", - "Found AI1 (node 0, player 2) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI4 (node 0, player 4) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI1 (node 2, player 3) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 4, player 5) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI2 (node 1, player 2) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI7 (node 5, player 5) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI5 (node 0, player 3) \n", - "Found AI2 (node 0, player 5) \n", - "Found AI2 (node 6, player 6) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI3 (node 0, player 7) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,884][39685] Initializing env for player 1, init_info: {'port': 40301}...\u001b[0m\n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 4, player 5) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 5, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "\n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI4 (node 0, player 4) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI7 (node 4, player 5) \n", - "Found AI1 (node 0, player 3) \n", - "Found AI2 (node 5, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI5 (node 4, player 5) \n", - "Found AI2 (node 3, player 3) \n", - "\n", - "Found AI3 (node 5, player 6) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 0, player 4) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI7 (node 0, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Found AI3 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI7 (node 0, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "\n", - "Found AI4 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 0, player 7) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI4 (node 4, player 4) \n", - "\n", - "Found AI5 (node 5, player 5) \n", - "Found AI3 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI5 (node 5, player 5) \n", - "\n", - "Found AI3 (node 6, player 6) \n", - "\n", - "Found AI6 (node 7, player 7) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "\n", - "\n", - "Found AI4 (node 4, player 4) \n", - "Found AI1 (node 2, player 2) \n", - "\n", - "Found AI3 (node 0, player 3) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI5 (node 7, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI6 (node 0, player 8) \n", - "\n", - "Found AI2 (node 2, player 2) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,935][39685] Initializing env for player 2, init_info: {'port': 40301}...\u001b[0m\n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI5 (node 0, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI4 (node 0, player 4) \n", - "Found AI5 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "\n", - "Found AI2 (node 2, player 2) \n", - "\n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI5 (node 5, player 5) \n", - "Found AI3 (node 0, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "\n", - "Found AI7 (node 7, player 8) \n", - "\n", - "\n", - "\n", - "\n", - "\n", - "Found AI2 (node 0, player 2) \n", - "\n", - "Found AI1 (node 2, player 3) \n", - "\n", - "Found AI4 (node 3, player 4) \n", - "Found AI5 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,991][39697] Initialized w:1 v:0 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,992][39685] Initializing env for player 3, init_info: {'port': 40301}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,993][39697] Initialized w:1 v:0 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,994][39697] Initialized w:1 v:0 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,994][39697] Initialized w:1 v:0 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,995][39697] Initialized w:1 v:0 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,995][39697] Initialized w:1 v:0 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,995][39697] Initialized w:1 v:0 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,995][39697] Initialized w:1 v:0 player:4\u001b[0m\n", - "\n", - "\u001b[36m[2023-09-12 21:01:53,997][39697] 8 agent workers initialized for env 1!\u001b[0m\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,031][39699] Initialized w:5 v:0 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,034][39699] Initialized w:5 v:0 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,034][39699] Initialized w:5 v:0 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,034][39699] Initialized w:5 v:0 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,035][39699] Initialized w:5 v:0 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,035][39734] Initialized w:7 v:0 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,035][39699] Initialized w:5 v:0 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,036][39699] Initialized w:5 v:0 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,036][39699] Initialized w:5 v:0 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,038][39734] Initialized w:7 v:0 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,038][39734] Initialized w:7 v:0 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,038][39734] Initialized w:7 v:0 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,038][39734] Initialized w:7 v:0 player:6\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,038][39699] 8 agent workers initialized for env 5!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,039][39734] Initialized w:7 v:0 player:0\u001b[0m\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,039][39734] Initialized w:7 v:0 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,039][39734] Initialized w:7 v:0 player:1\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,042][39734] 8 agent workers initialized for env 7!\u001b[0m\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,055][39733] Initialized w:6 v:0 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,055][39685] Initializing env for player 4, init_info: {'port': 40301}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,056][39697] Decorrelating experience for 0 frames...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,057][39733] Initialized w:6 v:0 player:1\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,058][39697] Port 40401 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,058][39697] Using port 40401\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,058][39733] Initialized w:6 v:0 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,058][39733] Initialized w:6 v:0 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,058][39733] Initialized w:6 v:0 player:6\u001b[0m\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,058][39697] Initializing env for player 0, init_info: {'port': 40401}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,059][39733] Initialized w:6 v:0 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,059][39733] Initialized w:6 v:0 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,059][39733] Initialized w:6 v:0 player:0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,061][39733] 8 agent workers initialized for env 6!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,064][39731] Initializing env for player 0, init_info: {'port': 40700}...\u001b[0m\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,086][39699] Decorrelating experience for 0 frames...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,088][39699] Port 40801 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,089][39699] Using port 40801\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,089][39699] Initializing env for player 0, init_info: {'port': 40801}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,091][39734] Decorrelating experience for 0 frames...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,093][39734] Port 41001 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,094][39734] Using port 41001\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,094][39697] Using port 40401 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:5\u001b[0m\n", - "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", - " logger.warn(\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,098][39731] Using port 40700 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:2\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,100][39698] 8 agent workers initialized for env 3!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,103][39685] Initializing env for player 5, init_info: {'port': 40301}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,112][39733] Decorrelating experience for 0 frames...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,114][39733] Port 40901 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,115][39733] Using port 40901\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,115][39731] Initializing env for player 1, init_info: {'port': 40700}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,115][39733] Initializing env for player 0, init_info: {'port': 40901}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,119][39696] Initialized w:2 v:0 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,120][39696] Initialized w:2 v:0 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,120][39696] Initialized w:2 v:0 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,120][39696] Initialized w:2 v:0 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,120][39696] Initialized w:2 v:0 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,120][39696] Initialized w:2 v:0 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,121][39696] Initialized w:2 v:0 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,121][39696] Initialized w:2 v:0 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,123][39697] Initializing env for player 1, init_info: {'port': 40401}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,124][39696] 8 agent workers initialized for env 2!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,132][39699] Using port 40801 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,141][39699] Initializing env for player 1, init_info: {'port': 40801}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,148][39698] Decorrelating experience for 0 frames...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,149][39698] Port 40601 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,150][39698] Using port 40601\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,150][39698] Initializing env for player 0, init_info: {'port': 40601}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,157][39733] Using port 40901 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,157][39696] Decorrelating experience for 0 frames...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,159][39696] Port 40501 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,159][39696] Using port 40501\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,166][39733] Initializing env for player 1, init_info: {'port': 40901}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,167][39685] Initializing env for player 6, init_info: {'port': 40301}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,165][39731] Initializing env for player 2, init_info: {'port': 40700}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,173][39697] Initializing env for player 2, init_info: {'port': 40401}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,179][39698] Using port 40601 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,192][39699] Initializing env for player 2, init_info: {'port': 40801}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,201][39698] Initializing env for player 1, init_info: {'port': 40601}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,213][39685] Initializing env for player 7, init_info: {'port': 40301}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,217][39731] Initializing env for player 3, init_info: {'port': 40700}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,219][39733] Initializing env for player 2, init_info: {'port': 40901}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,230][39697] Initializing env for player 3, init_info: {'port': 40401}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,242][39699] Initializing env for player 3, init_info: {'port': 40801}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,251][39698] Initializing env for player 2, init_info: {'port': 40601}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,269][39733] Initializing env for player 3, init_info: {'port': 40901}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,273][39731] Initializing env for player 4, init_info: {'port': 40700}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,283][39697] Initializing env for player 4, init_info: {'port': 40401}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,303][39698] Initializing env for player 3, init_info: {'port': 40601}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,318][39699] Initializing env for player 4, init_info: {'port': 40801}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,327][39731] Initializing env for player 5, init_info: {'port': 40700}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,339][39697] Initializing env for player 5, init_info: {'port': 40401}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,339][39733] Initializing env for player 4, init_info: {'port': 40901}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:54,355][39698] Initializing env for player 4, init_info: {'port': 40601}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:54,372][39699] Initializing env for player 5, init_info: {'port': 40801}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,387][39731] Initializing env for player 6, init_info: {'port': 40700}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,388][39733] Initializing env for player 5, init_info: {'port': 40901}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,395][39697] Initializing env for player 6, init_info: {'port': 40401}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,410][39698] Initializing env for player 5, init_info: {'port': 40601}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,427][39699] Initializing env for player 6, init_info: {'port': 40801}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,438][39733] Initializing env for player 6, init_info: {'port': 40901}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,443][39731] Initializing env for player 7, init_info: {'port': 40700}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,446][39697] Initializing env for player 7, init_info: {'port': 40401}...\u001b[0m\n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:54,463][39698] Initializing env for player 6, init_info: {'port': 40601}...\u001b[0m\n", - "Contacting host: -\u001b[37m\u001b[1m[2023-09-12 21:01:54,479][39699] Initializing env for player 7, init_info: {'port': 40801}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,499][39733] Initializing env for player 7, init_info: {'port': 40901}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,523][39698] Initializing env for player 7, init_info: {'port': 40601}...\u001b[0m\n", - "Got connect from node 1. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: .. [ 2/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 2. \n", - "Waiting for players: ... [ 3/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ... [ 3/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Waiting for players: ...... [ 6/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 1. \n", - "Waiting for players: .. [ 2/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Waiting for players: ... [ 3/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. \n", - "Waiting for players: .. [ 2/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. 8]\n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Waiting for players: .... [ 4/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 6. \n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 3. 8]\n", - "Got connect from node 4. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 2. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: .. [ 2/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Done waiting.Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ... [ 3/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 3. 8]\n", - "Got connect from node 4. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Waiting for players: ....... [ 7/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Got connect from node 2. 8]\n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Console player number: 7 8]\n", - "Received All Here, sending ACK. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 5. 8]\n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Console player number: 2 8]\n", - "Received All Here, sending ACK. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Total players: 8 8]\n", - "Waiting for other players: ....\n", - "Waiting for other players: . [ 5/ 8]....8]..\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "\n", - "Go \n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "\n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 ... 7/ 8]. [ 7/ 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "\n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "\n", - "Exchanging game information.\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Go \n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "\n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "\n", - "Go \n", - "\n", - "Go \n", - "Total players: 8 \n", - "Total players: 8 \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Go \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "Received \"Go.\" \n", - "\n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI1 (node 1, player 2) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI4 (node 6, player 7) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI2 (node 3, player 4) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Found AI1 (node 0, player 2) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI4 (node 6, player 7) \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI6 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "\n", - "Go \n", - "Found AI4 (node 0, player 7) \n", - "Total players: 8 \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "\n", - "Found AI2 (node 0, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI4 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI6 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI4 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Received All Here, sending ACK. \n", - "\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 0, player 3) \n", - "\n", - "Exchanging game information.\n", - "Found AI2 (node 3, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI4 (node 6, player 7) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI6 (node 0, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI4 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 5, player 5) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI4 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI1 (node 1, player 2) \n", - "\n", - "Found AI2 (node 2, player 3) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI4 (node 0, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI4 (node 2, player 3) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI7 (node 0, player 6) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 1, player 2) \n", - "Found AI1 (node 2, player 3) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI6 (node 5, player 5) \n", - "Found AI3 (node 4, player 4) \n", - "\n", - "Found AI3 (node 0, player 6) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI5 (node 0, player 7) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI6 (node 0, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 0, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "\n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI3 (node 0, player 4) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI4 (node 4, player 5) \n", - "\n", - "Found AI4 (node 3, player 4) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 7, player 7) \n", - "Found AI6 (node 0, player 8) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI3 (node 0, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI2 (node 0, player 2) \n", - "Found AI1 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,800][39685] Initialized w:0 v:1 player:4\u001b[0m\n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI3 (node 2, player 3) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,802][39685] Initialized w:0 v:1 player:1\u001b[0m\n", - "Found AI4 (node 3, player 4) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,802][39685] Initialized w:0 v:1 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,802][39685] Initialized w:0 v:1 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,802][39685] Initialized w:0 v:1 player:7\u001b[0m\n", - "Found AI7 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,803][39685] Initialized w:0 v:1 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,803][39685] Initialized w:0 v:1 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,803][39685] Initialized w:0 v:1 player:2\u001b[0m\n", - "Found AI2 (node 4, player 5) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "\u001b[36m[2023-09-12 21:01:55,805][39685] 8 agent workers initialized for env 0!\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 0, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI6 (node 5, player 5) \n", - "Found AI3 (node 6, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 0, player 7) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI6 (node 5, player 5) \n", - "Found AI3 (node 6, player 6) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI5 (node 7, player 7) \n", - "Found AI4 (node 2, player 3) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 0, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI2 (node 4, player 5) \n", - "\n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 0, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI4 (node 0, player 4) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI2 (node 0, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 0, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI1 (node 2, player 2) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,848][39734] Initializing env for player 0, init_info: {'port': 41001}...\u001b[0m\n", - "Found AI2 (node 5, player 5) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI2 (node 0, player 5) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI2 (node 4, player 5) \n", - "\n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "\n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,857][39685] Decorrelating experience for 32 frames...\u001b[0m\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "Found AI1 (node 2, player 2) \n", - "\n", - "Found AI3 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "\n", - "\n", - "\n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,898][39734] Using port 41001 on host...\u001b[0m\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,898][39734] Initializing env for player 1, init_info: {'port': 41001}...\u001b[0m\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,931][39698] Initialized w:3 v:1 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,933][39698] Initialized w:3 v:1 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,933][39698] Initialized w:3 v:1 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,934][39698] Initialized w:3 v:1 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,934][39698] Initialized w:3 v:1 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,934][39698] Initialized w:3 v:1 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,934][39698] Initialized w:3 v:1 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,934][39698] Initialized w:3 v:1 player:0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:55,937][39698] 8 agent workers initialized for env 3!\u001b[0m\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,950][39734] Initializing env for player 2, init_info: {'port': 41001}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,969][39733] Initialized w:6 v:1 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,971][39733] Initialized w:6 v:1 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,971][39733] Initialized w:6 v:1 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,972][39733] Initialized w:6 v:1 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,972][39733] Initialized w:6 v:1 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,972][39733] Initialized w:6 v:1 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,973][39733] Initialized w:6 v:1 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,973][39733] Initialized w:6 v:1 player:4\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:55,974][39733] 8 agent workers initialized for env 6!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,974][39698] Decorrelating experience for 32 frames...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,977][39731] Initialized w:4 v:0 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,977][39731] Initialized w:4 v:0 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,978][39731] Initialized w:4 v:0 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,978][39731] Initialized w:4 v:0 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,978][39731] Initialized w:4 v:0 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,978][39696] Initializing env for player 0, init_info: {'port': 40501}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,978][39731] Initialized w:4 v:0 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,979][39731] Initialized w:4 v:0 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,979][39731] Initialized w:4 v:0 player:0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:55,982][39731] 8 agent workers initialized for env 4!\u001b[0m\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,004][39697] Initialized w:1 v:1 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,007][39697] Initialized w:1 v:1 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,007][39697] Initialized w:1 v:1 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,008][39697] Initialized w:1 v:1 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,008][39697] Initialized w:1 v:1 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,008][39697] Initialized w:1 v:1 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,008][39697] Initialized w:1 v:1 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,009][39697] Initialized w:1 v:1 player:7\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,011][39697] 8 agent workers initialized for env 1!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,015][39734] Initializing env for player 3, init_info: {'port': 41001}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,024][39731] Decorrelating experience for 0 frames...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,024][39696] Using port 40501 on host...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,029][39731] Port 40701 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,029][39731] Using port 40701\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,030][39731] Initializing env for player 0, init_info: {'port': 40701}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,030][39733] Decorrelating experience for 32 frames...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,035][39696] Initializing env for player 1, init_info: {'port': 40501}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,042][39697] Decorrelating experience for 32 frames...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,055][39699] Initialized w:5 v:1 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,056][39699] Initialized w:5 v:1 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,057][39699] Initialized w:5 v:1 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,057][39699] Initialized w:5 v:1 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,057][39699] Initialized w:5 v:1 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,058][39699] Initialized w:5 v:1 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,058][39699] Initialized w:5 v:1 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,059][39699] Initialized w:5 v:1 player:5\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,061][39699] 8 agent workers initialized for env 5!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,067][39734] Initializing env for player 4, init_info: {'port': 41001}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,070][39731] Using port 40701 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,080][39731] Initializing env for player 1, init_info: {'port': 40701}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,088][39696] Initializing env for player 2, init_info: {'port': 40501}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,096][39699] Decorrelating experience for 32 frames...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,131][39731] Initializing env for player 2, init_info: {'port': 40701}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,126][39734] Initializing env for player 5, init_info: {'port': 41001}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,139][39696] Initializing env for player 3, init_info: {'port': 40501}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,179][39734] Initializing env for player 6, init_info: {'port': 41001}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,183][39731] Initializing env for player 3, init_info: {'port': 40701}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,195][39696] Initializing env for player 4, init_info: {'port': 40501}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,231][39734] Initializing env for player 7, init_info: {'port': 41001}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,235][39731] Initializing env for player 4, init_info: {'port': 40701}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,241][39696] Initializing env for player 5, init_info: {'port': 40501}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,259][39685] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,284][39731] Initializing env for player 5, init_info: {'port': 40701}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,299][39696] Initializing env for player 6, init_info: {'port': 40501}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,306][39685] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,338][39731] Initializing env for player 6, init_info: {'port': 40701}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,340][39685] Port 40302 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,340][39685] Using port 40302\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,341][39685] Initializing env for player 0, init_info: {'port': 40302}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,360][39696] Initializing env for player 7, init_info: {'port': 40501}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,367][39698] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,387][39685] Using port 40302 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,391][39731] Initializing env for player 7, init_info: {'port': 40701}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,398][39685] Initializing env for player 1, init_info: {'port': 40302}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,413][39698] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,437][39733] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,455][39685] Initializing env for player 2, init_info: {'port': 40302}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,459][39698] Port 40602 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,459][39698] Using port 40602\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,460][39698] Initializing env for player 0, init_info: {'port': 40602}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,482][39733] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,505][39698] Using port 40602 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,505][39685] Initializing env for player 3, init_info: {'port': 40302}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,509][39697] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,516][39698] Initializing env for player 1, init_info: {'port': 40602}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,528][39733] Port 40902 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,528][39733] Using port 40902\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,529][39733] Initializing env for player 0, init_info: {'port': 40902}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,553][39697] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,555][39699] Multi agent env, num agents: 8\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:56,557][39685] Initializing env for player 4, init_info: {'port': 40302}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:56,566][39698] Initializing env for player 2, init_info: {'port': 40602}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:56,573][39733] Using port 40902 on host...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:56,584][39733] Initializing env for player 1, init_info: {'port': 40902}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,605][39699] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,611][39685] Initializing env for player 5, init_info: {'port': 40302}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,617][39698] Initializing env for player 3, init_info: {'port': 40602}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,621][39697] Port 40402 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,621][39697] Using port 40402\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,622][39697] Initializing env for player 0, init_info: {'port': 40402}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]\u001b[36m[2023-09-12 21:01:56,637][39699] Port 40802 is available\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[36m[2023-09-12 21:01:56,637][39699] Using port 40802\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,637][39699] Initializing env for player 0, init_info: {'port': 40802}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,644][39733] Initializing env for player 2, init_info: {'port': 40902}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,658][39697] Using port 40402 on host...\u001b[0m\n", - "Contacting host: -\u001b[37m\u001b[1m[2023-09-12 21:01:56,659][39685] Initializing env for player 6, init_info: {'port': 40302}...\u001b[0m\n", - "Contacting host: -\u001b[37m\u001b[1m[2023-09-12 21:01:56,673][39697] Initializing env for player 1, init_info: {'port': 40402}...\u001b[0m\n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:56,676][39698] Initializing env for player 4, init_info: {'port': 40602}...\u001b[0m\n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Waiting for players: ... [ 3/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:56,681][39699] Using port 40802 on host...\u001b[0m\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:56,688][39699] Initializing env for player 1, init_info: {'port': 40802}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,707][39733] Initializing env for player 3, init_info: {'port': 40902}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,713][39685] Initializing env for player 7, init_info: {'port': 40302}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:56,726][39697] Initializing env for player 2, init_info: {'port': 40402}...\u001b[0m\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:56,739][39699] Initializing env for player 2, init_info: {'port': 40802}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:56,747][39698] Initializing env for player 5, init_info: {'port': 40602}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,755][39733] Initializing env for player 4, init_info: {'port': 40902}...\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 3. \n", - "Contacting host: -\u001b[37m\u001b[1m[2023-09-12 21:01:56,787][39697] Initializing env for player 3, init_info: {'port': 40402}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,790][39699] Initializing env for player 3, init_info: {'port': 40802}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,801][39698] Initializing env for player 6, init_info: {'port': 40602}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:56,821][39733] Initializing env for player 5, init_info: {'port': 40902}...\u001b[0m\n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -\u001b[37m\u001b[1m[2023-09-12 21:01:56,851][39698] Initializing env for player 7, init_info: {'port': 40602}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,851][39697] Initializing env for player 4, init_info: {'port': 40402}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,856][39699] Initializing env for player 4, init_info: {'port': 40802}...\u001b[0m\n", - "Waiting for other players: ...Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: .... [ 4/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. 8]\n", - "Got connect from node 2. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,883][39733] Initializing env for player 6, init_info: {'port': 40902}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,903][39697] Initializing env for player 5, init_info: {'port': 40402}...\u001b[0m\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:56,927][39699] Initializing env for player 5, init_info: {'port': 40802}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,935][39733] Initializing env for player 7, init_info: {'port': 40902}...\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Got connect from node 3. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,973][39699] Initializing env for player 6, init_info: {'port': 40802}...\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 3. \n", - "Got connect from node 7. 8]\n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Contacting host: -\u001b[37m\u001b[1m[2023-09-12 21:01:57,024][39699] Initializing env for player 7, init_info: {'port': 40802}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,971][39697] Initializing env for player 6, init_info: {'port': 40402}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,035][39697] Initializing env for player 7, init_info: {'port': 40402}...\u001b[0m\n", - "Got connect from node 4. 8]\n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Got connect from node 4. 8]\n", - "Waiting for players: ..... [ 5/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ........ [ 8/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 7 8]\n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Waiting for other players: ..... [ 5/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 4 8]\n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Waiting for players: ..... [ 5/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "\n", - "Go \n", - "Total players: 8 \n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Go \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "Waiting for other players: ..... [ 5/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Exchanging game information.\n", - "Exchanging game information.Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Contacting host: -\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Got connect from node 1. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Waiting for players: . [ 1/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI0_host (node 1, player 1) \n", - "Got connect from node 1. \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Got connect from node 1. \n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Got connect from node 2. 8]\n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Found AI7 (node 7, player 8) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI5 (node 2, player 3) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI2 (node 3, player 4) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 6, player 6) \n", - "Found AI3 (node 7, player 7) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Found AI7 (node 0, player 8) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI0_host (node 1, player 1) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 1, player 2) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 3, player 3) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI6 (node 0, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Got connect from node 2. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI5 (node 2, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI6 (node 0, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI7 (node 7, player 8) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 0, player 3) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Found AI2 (node 3, player 4) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI2 (node 4, player 4) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI3 (node 6, player 7) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI6 (node 6, player 6) \n", - "Found AI3 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Go \n", - "Total players: 8 \n", - "Found AI1 (node 2, player 2) 8]\n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 0, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Waiting for players: ....... [ 7/ 8] 7/ 8]\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "\n", - "Found AI6 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI2 (node 0, player 4) 8]8] [ 2/ 8]\n", - "Found AI4 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI1 (node 2, player 2) 8]\n", - "\n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Contacting host: -\n", - "Found AI6 (node 6, player 6) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Found AI5 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI6 (node 6, player 6) \n", - "Found AI5 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI1 (node 0, player 2) \n", - "\n", - "Exchanging game information.Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "\n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for players: ... [ 3/ 8] 7/ 8]\n", - "Exchanging game information.\n", - "\n", - "Contacting host: -players: ....... [ 7/ 8]\n", - "\n", - "Contacting host: -\n", - "Got connect from node 4. 8]\n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Waiting for players: ....... [ 7/ 8]\n", - "Got connect from node 7. 8]\n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Got connect from node 3. \n", - "Got connect from node 4. 4/ 8].. [ 5/ 8]\n", - "Got connect from node 5. [ 5/ 8]\n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - ".. [ 8/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 \n", - "\n", - "Found AI0_host (node 1, player 1) 8]\n", - "....... [ 7/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:57,632][39734] Initialized w:7 v:1 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,633][39734] Initialized w:7 v:1 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,633][39734] Initialized w:7 v:1 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,634][39734] Initialized w:7 v:1 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,634][39734] Initialized w:7 v:1 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,634][39734] Initialized w:7 v:1 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,634][39734] Initialized w:7 v:1 player:6\u001b[0m\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,635][39734] Initialized w:7 v:1 player:5\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:57,636][39734] 8 agent workers initialized for env 7!\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Waiting for other players: ....... [ 7/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI0_host (node 1, player 1) 8]\n", - "Got connect from node 3. 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,687][39696] Initialized w:2 v:1 player:5\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:57,688][39696] Initialized w:2 v:1 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,688][39696] Initialized w:2 v:1 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,689][39696] Initialized w:2 v:1 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,690][39696] Initialized w:2 v:1 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,690][39696] Initialized w:2 v:1 player:2\u001b[0m\n", - "Waiting for other players: .... [ 4/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:57,691][39696] Initialized w:2 v:1 player:3\u001b[0m\n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Done waiting.\u001b[37m\u001b[1m[2023-09-12 21:01:57,692][39696] Initialized w:2 v:1 player:7\u001b[0m\n", - "Found AI6 (node 6, player 7) \n", - "Found AI5 (node 5, player 6) \n", - "\u001b[36m[2023-09-12 21:01:57,692][39696] 8 agent workers initialized for env 2!\u001b[0m\n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI4 (node 2, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI1 (node 2, player 2) 8]\n", - "Found AI4 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ........ [ 8/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:57,710][39734] Decorrelating experience for 32 frames...\u001b[0m\n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Console player number: 2 8]\n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 2, player 2) 8]\n", - "Found AI4 (node 3, player 3) 8]\n", - "Found AI2 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Console player number: 3 8]\n", - "Received All Here, sending ACK. \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Console player number: 4 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Waiting for other players: ........ [ 8/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:57,747][39696] Decorrelating experience for 32 frames...\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Found AI1 (node 0, player 2) \n", - "Found AI4 (node 2, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI4 (node 0, player 3) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) 8]\n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI2 (node 0, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI3 (node 0, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 8]\n", - "Received All Here, sending ACK. \n", - "\n", - "Go \n", - "Total players: 8 \n", - "\n", - "\n", - "\n", - "\n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "\n", - "Go \n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Contacting host: -\n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Done waiting.\n", - "Exchanging game information.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Go \n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:57,901][39731] Initialized w:4 v:1 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,902][39731] Initialized w:4 v:1 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,902][39731] Initialized w:4 v:1 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,902][39731] Initialized w:4 v:1 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,903][39731] Initialized w:4 v:1 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,903][39731] Initialized w:4 v:1 player:0\u001b[0m\n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:57,904][39731] Initialized w:4 v:1 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,904][39731] Initialized w:4 v:1 player:2\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:57,906][39731] 8 agent workers initialized for env 4!\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "\n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Found AI0_host (node 1, player 1) 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,948][39731] Decorrelating experience for 32 frames...\u001b[0m\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI0_host (node 1, player 1) 8]\n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[36m[2023-09-12 21:01:58,004][39734] Multi agent env, num agents: 8\u001b[0m\n", - "Found AI2 (node 2, player 3) 8]\n", - "Found AI3 (node 3, player 4) \n", - "Found AI5 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI1 (node 1, player 2) \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 1, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Found AI3 (node 3, player 4) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 0, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[36m[2023-09-12 21:01:58,038][39734] Multi agent env, num agents: 8\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 0, player 6) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI5 (node 4, player 5) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 0, player 4) \n", - "Found AI5 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI5 (node 0, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Go \n", - "Total players: 8 \n", - "\u001b[36m[2023-09-12 21:01:58,069][39734] Port 41002 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:58,069][39734] Using port 41002\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,069][39734] Initializing env for player 0, init_info: {'port': 41002}...\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI5 (node 5, player 5) \n", - "Found AI4 (node 0, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI5 (node 5, player 5) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 6, player 6) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI2 (node 3, player 3) \n", - "\n", - "Found AI6 (node 7, player 7) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI3 (node 4, player 4) \n", - "Found AI5 (node 0, player 8) \n", - "Found AI5 (node 5, player 5) \n", - "Found AI4 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:58,100][39734] Using port 41002 on host...\u001b[0m\n", - "Found AI2 (node 1, player 2) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI1 (node 2, player 3) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI5 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI2 (node 0, player 2) \n", - "\n", - "Go \n", - "Found AI1 (node 2, player 3) \n", - "Total players: 8 \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI5 (node 7, player 8) \n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:58,120][39734] Initializing env for player 1, init_info: {'port': 41002}...\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI2 (node 2, player 2) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI2 (node 2, player 2) \n", - "\n", - "Found AI1 (node 0, player 3) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI3 (node 0, player 5) \n", - "\n", - "Found AI5 (node 5, player 6) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 0, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,171][39734] Initializing env for player 2, init_info: {'port': 41002}...\u001b[0m\n", - "\n", - "Exchanging game information.\n", - "\u001b[36m[2023-09-12 21:01:58,185][39696] Multi agent env, num agents: 8\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "\n", - "\n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,227][39734] Initializing env for player 3, init_info: {'port': 41002}...\u001b[0m\n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[36m[2023-09-12 21:01:58,232][39696] Multi agent env, num agents: 8\u001b[0m\n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,239][39685] Initialized w:0 v:2 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,241][39685] Initialized w:0 v:2 player:6\u001b[0m\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,242][39685] Initialized w:0 v:2 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,243][39685] Initialized w:0 v:2 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,244][39685] Initialized w:0 v:2 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,245][39685] Initialized w:0 v:2 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,246][39685] Initialized w:0 v:2 player:4\u001b[0m\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,249][39685] Initialized w:0 v:2 player:7\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[36m[2023-09-12 21:01:58,250][39685] 8 agent workers initialized for env 0!\u001b[0m\n", - "\n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,275][39734] Initializing env for player 4, init_info: {'port': 41002}...\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI3 (node 3, player 4) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,279][39733] Initialized w:6 v:2 player:3\u001b[0m\n", - "Found AI1 (node 1, player 2) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI7 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI2 (node 2, player 3) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,281][39733] Initialized w:6 v:2 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,281][39733] Initialized w:6 v:2 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,284][39733] Initialized w:6 v:2 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,284][39733] Initialized w:6 v:2 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,287][39733] Initialized w:6 v:2 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,287][39733] Initialized w:6 v:2 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,288][39733] Initialized w:6 v:2 player:4\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:58,289][39733] 8 agent workers initialized for env 6!\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI7 (node 5, player 5) \n", - "Found AI4 (node 6, player 6) \n", - "Found AI5 (node 0, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 0, player 4) \n", - "Found AI7 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI7 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,310][39698] Initialized w:3 v:2 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,312][39698] Initialized w:3 v:2 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,312][39698] Initialized w:3 v:2 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,312][39698] Initialized w:3 v:2 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,312][39698] Initialized w:3 v:2 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,312][39698] Initialized w:3 v:2 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,313][39698] Initialized w:3 v:2 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,313][39698] Initialized w:3 v:2 player:2\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[36m[2023-09-12 21:01:58,318][39698] 8 agent workers initialized for env 3!\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI7 (node 5, player 5) \n", - "Found AI4 (node 6, player 6) \n", - "Found AI5 (node 7, player 7) \n", - "Found AI6 (node 0, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,327][39734] Initializing env for player 5, init_info: {'port': 41002}...\u001b[0m\n", - "Found AI4 (node 4, player 5) \n", - "\u001b[36m[2023-09-12 21:01:58,328][39696] Port 40502 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:58,328][39696] Using port 40502\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,329][39696] Initializing env for player 0, init_info: {'port': 40502}...\u001b[0m\n", - "Found AI7 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,329][39685] Decorrelating experience for 64 frames...\u001b[0m\n", - "Found AI1 (node 1, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,343][39733] Decorrelating experience for 64 frames...\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI7 (node 0, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI7 (node 5, player 5) \n", - "Found AI4 (node 0, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,362][39696] Using port 40502 on host...\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI7 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 0, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,379][39696] Initializing env for player 1, init_info: {'port': 40502}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,379][39734] Initializing env for player 6, init_info: {'port': 41002}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,384][39698] Decorrelating experience for 64 frames...\u001b[0m\n", - "\n", - "\u001b[36m[2023-09-12 21:01:58,395][39731] Multi agent env, num agents: 8\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "\n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,431][39696] Initializing env for player 2, init_info: {'port': 40502}...\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "\u001b[36m[2023-09-12 21:01:58,434][39731] Multi agent env, num agents: 8\u001b[0m\n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,442][39734] Initializing env for player 7, init_info: {'port': 41002}...\u001b[0m\n", - "\n", - "\n", - "\n", - "\n", - "\u001b[36m[2023-09-12 21:01:58,471][39731] Port 40702 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:58,471][39731] Using port 40702\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,472][39731] Initializing env for player 0, init_info: {'port': 40702}...\u001b[0m\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,487][39696] Initializing env for player 3, init_info: {'port': 40502}...\u001b[0m\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,509][39731] Using port 40702 on host...\u001b[0m\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,522][39731] Initializing env for player 1, init_info: {'port': 40702}...\u001b[0m\n", - "\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,547][39696] Initializing env for player 4, init_info: {'port': 40502}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,571][39697] Initialized w:1 v:2 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,575][39731] Initializing env for player 2, init_info: {'port': 40702}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,577][39697] Initialized w:1 v:2 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,577][39697] Initialized w:1 v:2 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,578][39697] Initialized w:1 v:2 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,578][39697] Initialized w:1 v:2 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,578][39697] Initialized w:1 v:2 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,578][39697] Initialized w:1 v:2 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,579][39697] Initialized w:1 v:2 player:5\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:58,583][39697] 8 agent workers initialized for env 1!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,594][39696] Initializing env for player 5, init_info: {'port': 40502}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,615][39699] Initialized w:5 v:2 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,619][39699] Initialized w:5 v:2 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,620][39699] Initialized w:5 v:2 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,623][39699] Initialized w:5 v:2 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,625][39699] Initialized w:5 v:2 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,626][39699] Initialized w:5 v:2 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,626][39699] Initialized w:5 v:2 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,627][39699] Initialized w:5 v:2 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,627][39731] Initializing env for player 3, init_info: {'port': 40702}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:58,628][39699] 8 agent workers initialized for env 5!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,641][39697] Decorrelating experience for 64 frames...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,655][39696] Initializing env for player 6, init_info: {'port': 40502}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:58,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,678][39731] Initializing env for player 4, init_info: {'port': 40702}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,707][39696] Initializing env for player 7, init_info: {'port': 40502}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,717][39699] Decorrelating experience for 64 frames...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:58,731][39731] Initializing env for player 5, init_info: {'port': 40702}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:58,795][39731] Initializing env for player 6, init_info: {'port': 40702}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -\u001b[37m\u001b[1m[2023-09-12 21:01:58,871][39731] Initializing env for player 7, init_info: {'port': 40702}...\u001b[0m\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 3. \n", - "Waiting for players: .... [ 4/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: .... [ 4/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ...... [ 6/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[36m[2023-09-12 21:01:59,191][39733] Port 40903 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:59,191][39733] Using port 40903\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,192][39733] Initializing env for player 0, init_info: {'port': 40903}...\u001b[0m\n", - "Contacting host: -\u001b[37m\u001b[1m[2023-09-12 21:01:59,221][39733] Using port 40903 on host...\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Got connect from node 6. 8]\n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,243][39733] Initializing env for player 1, init_info: {'port': 40903}...\u001b[0m\n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Total players: 8 8]\n", - "Waiting for other players: \n", - "Waiting for other players: .. [ 8/ 8]. [ 1/ 8] [ 6/ 8]\n", - "Waiting for other players: ........ [ 8/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -\u001b[37m\u001b[1m[2023-09-12 21:01:59,293][39733] Initializing env for player 2, init_info: {'port': 40903}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:59,302][39685] Port 40303 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:59,302][39685] Using port 40303\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,302][39685] Initializing env for player 0, init_info: {'port': 40303}...\u001b[0m\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ........ [ 8/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Waiting for players: ...... [ 6/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:59,347][39685] Using port 40303 on host...\u001b[0m\n", - "Waiting for players: ...... [ 6/ 8]\u001b[36m[2023-09-12 21:01:59,347][39698] Port 40603 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:59,348][39698] Using port 40603\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,347][39733] Initializing env for player 3, init_info: {'port': 40903}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,348][39698] Initializing env for player 0, init_info: {'port': 40603}...\u001b[0m\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,360][39685] Initializing env for player 1, init_info: {'port': 40303}...\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:59,392][39698] Using port 40603 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,402][39698] Initializing env for player 1, init_info: {'port': 40603}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,409][39733] Initializing env for player 4, init_info: {'port': 40903}...\u001b[0m\n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,419][39685] Initializing env for player 2, init_info: {'port': 40303}...\u001b[0m\n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 3 8]\n", - "Received All Here, sending ACK. \n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Contacting host: -s: ... [ 3/ 8]\n", - "Go \n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:59,459][39698] Initializing env for player 2, init_info: {'port': 40603}...\u001b[0m\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:59,467][39733] Initializing env for player 5, init_info: {'port': 40903}...\u001b[0m\n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:59,470][39685] Initializing env for player 3, init_info: {'port': 40303}...\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,517][39698] Initializing env for player 3, init_info: {'port': 40603}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,519][39733] Initializing env for player 6, init_info: {'port': 40903}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "Waiting for other players: ........ [ 8/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:59,523][39685] Initializing env for player 4, init_info: {'port': 40303}...\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "\n", - "Found AI6 (node 6, player 7) \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI6 (node 7, player 7) \n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Found AI6 (node 6, player 7) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,575][39685] Initializing env for player 5, init_info: {'port': 40303}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,575][39698] Initializing env for player 4, init_info: {'port': 40603}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,578][39733] Initializing env for player 7, init_info: {'port': 40903}...\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 6, player 7) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "\u001b[36m[2023-09-12 21:01:59,592][39697] Port 40403 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:59,592][39697] Using port 40403\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,592][39697] Initializing env for player 0, init_info: {'port': 40403}...\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 6, player 7) \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,623][39698] Initializing env for player 5, init_info: {'port': 40603}...\u001b[0m\n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Waiting for other players: ...... [ 6/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:59,629][39697] Using port 40403 on host...\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 6, player 7) \n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 6, player 7) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,643][39697] Initializing env for player 1, init_info: {'port': 40403}...\u001b[0m\n", - "\n", - "Go \n", - "Total players: 8 \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI2 (node 1, player 2) \n", - "Found AI1 (node 2, player 3) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI4 (node 3, player 4) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,664][39685] Initializing env for player 6, init_info: {'port': 40303}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:59,664][39699] Port 40803 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:59,665][39699] Using port 40803\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,665][39699] Initializing env for player 0, init_info: {'port': 40803}...\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 0, player 8) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 0, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 7, player 8) \n", - "\n", - "Exchanging game information.\n", - "Found AI2 (node 0, player 2) \n", - "Found AI1 (node 2, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 7, player 8) \n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Waiting for other players: ........ [ 8/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:59,694][39697] Initializing env for player 2, init_info: {'port': 40403}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,695][39698] Initializing env for player 6, init_info: {'port': 40603}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:59,707][39699] Using port 40803 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,718][39699] Initializing env for player 1, init_info: {'port': 40803}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,719][39685] Initializing env for player 7, init_info: {'port': 40303}...\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 0, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 7, player 8) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Exchanging game information.\n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI7 (node 0, player 6) \n", - "Found AI5 (node 7, player 8) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 0, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 7, player 8) \n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:59,744][39697] Initializing env for player 3, init_info: {'port': 40403}...\u001b[0m\n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:59,751][39698] Initializing env for player 7, init_info: {'port': 40603}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 7, player 8) \n", - "\n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,768][39699] Initializing env for player 2, init_info: {'port': 40803}...\u001b[0m\n", - "\n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI0_host (node 1, player 1) \n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:59,795][39697] Initializing env for player 4, init_info: {'port': 40403}...\u001b[0m\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:59,819][39699] Initializing env for player 3, init_info: {'port': 40803}...\u001b[0m\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "\n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Go \n", - "Total players: 8 \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Exchanging game information.\n", - "Found AI0_host (node 1, player 1) \n", - "Got connect from node 1. \n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI5 (node 1, player 2) \n", - "Found AI1 (node 2, player 3) \n", - "Found AI6 (node 6, player 7) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,857][39697] Initializing env for player 5, init_info: {'port': 40403}...\u001b[0m\n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,871][39699] Initializing env for player 4, init_info: {'port': 40803}...\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI5 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI2 (node 0, player 4) \n", - "\n", - "Found AI4 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:59,887][39734] Initialized w:7 v:2 player:3\u001b[0m\n", - "Received All Here, sending ACK. \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,888][39734] Initialized w:7 v:2 player:6\u001b[0m\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,889][39734] Initialized w:7 v:2 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,890][39734] Initialized w:7 v:2 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,890][39734] Initialized w:7 v:2 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,891][39734] Initialized w:7 v:2 player:5\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,891][39734] Initialized w:7 v:2 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,892][39734] Initialized w:7 v:2 player:4\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[36m[2023-09-12 21:01:59,893][39734] 8 agent workers initialized for env 7!\u001b[0m\n", - "Found AI5 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI3 (node 0, player 6) \n", - "\n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Exchanging game information.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:59,911][39697] Initializing env for player 6, init_info: {'port': 40403}...\u001b[0m\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", + "Done waiting.Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", "Contacting host: /Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI5 (node 0, player 2) \n", - "Found AI1 (node 2, player 3) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,931][39699] Initializing env for player 5, init_info: {'port': 40803}...\u001b[0m\n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 2, player 2) \n", - "Found AI1 (node 0, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:59,942][39734] Decorrelating experience for 64 frames...\u001b[0m\n", - "Found AI5 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI3 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI3 (node 6, player 6) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Got connect from node 2. \n", - "Waiting for players: ... [ 3/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,967][39697] Initializing env for player 7, init_info: {'port': 40403}...\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,979][39699] Initializing env for player 6, init_info: {'port': 40803}...\u001b[0m\n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Waiting for players: . [ 1/ 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ... [ 3/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", "Contacting host: /Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,039][39699] Initializing env for player 7, init_info: {'port': 40803}...\u001b[0m\n", - "Found AI1 (node 1, player 2) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI4 (node 4, player 5) \n", - "\n", - "Found AI5 (node 5, player 6) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI3 (node 2, player 3) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Waiting for players: ..... [ 5/ 8]Press 'Q' to abort network game synchronization.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:02:00,070][39696] Initialized w:2 v:2 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,072][39696] Initialized w:2 v:2 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,072][39696] Initialized w:2 v:2 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,073][39696] Initialized w:2 v:2 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,073][39696] Initialized w:2 v:2 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,074][39696] Initialized w:2 v:2 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,074][39696] Initialized w:2 v:2 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,074][39696] Initialized w:2 v:2 player:4\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:00,076][39696] 8 agent workers initialized for env 2!\u001b[0m\n", - "Found AI1 (node 0, player 2) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Press 'Q' to abort network game synchronization.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", + "Total players: 2 \n", "\n", - "Waiting for other players: ... [ 3/ 8]\n", + "Waiting for other players: .. [ 2/ 2]\n", "Got connect from node 1. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 0, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Found AI1 (node 2, player 2) 8]\n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,122][39696] Decorrelating experience for 64 frames...\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 0, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Contacting host: -\n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Contacting host: -s: ....... [ 7/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "\n", - "Got connect from node 3. 8]\n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -\n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", + "Waiting for players: .. [ 2/ 2]\n", "Sending all here. \n", "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,279][39731] Initialized w:4 v:2 player:5\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:02:00,280][39731] Initialized w:4 v:2 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,280][39731] Initialized w:4 v:2 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,280][39731] Initialized w:4 v:2 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,280][39731] Initialized w:4 v:2 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,280][39731] Initialized w:4 v:2 player:1\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:02:00,282][39731] Initialized w:4 v:2 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,282][39731] Initialized w:4 v:2 player:6\u001b[0m\n", - "Waiting for other players: ........ [ 8/ 8]\u001b[36m[2023-09-12 21:02:00,283][39731] 8 agent workers initialized for env 4!\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Got connect from node 4. 8]\n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Waiting for other players: ........ [ 8/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,332][39731] Decorrelating experience for 64 frames...\u001b[0m\n", - "Console player number: 7 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Got connect from node 7. 8]\n", - "Waiting for players: ........ [ 8/ 8]\n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", "Sending all here. \n", "\n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Waiting for players: ....... [ 7/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: \n", - "Console player number: 3 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 8]\n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Got connect from node 1. 8]\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Go \n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Total players: 8 \n", + "Total players: 2 \n", "\n", - "Waiting for other players: ....... [ 7/ 8]\n", + "Waiting for other players: .. [ 2/ 2]\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Got connect from node 7. 8]\n", - "Waiting for players: ........ [ 8/ 8]\n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", "Sending all here. \n", "\n", "Got connect from node 1. \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "\n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Total players: 8 \n", + "Total players: 2 \n", "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Got connect from node 2. \n", - "Waiting for players: ... [ 3/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ........ [ 8/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[36m[2023-09-12 21:02:00,573][39734] Port 41003 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:00,573][39734] Using port 41003\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,573][39734] Initializing env for player 0, init_info: {'port': 41003}...\u001b[0m\n", - "Found AI0_host (node 1, player 1) 8]\n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", + "Waiting for other players: .. [ 2/ 2]\n", "\n", "Go \n", - "Total players: 8 \n", - "Total players: 8 \n", + "Total players: 2 \n", + "Total players: 2 \n", "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Total players: 8 \n", + "Waiting for other players: .. [ 2/ 2]\n", + "Total players: 2 \n", "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", + "Waiting for other players: .. [ 2/ 2]\n", "\n", - "Total players: 8 \n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Total players: 8 \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,605][39734] Using port 41003 on host...\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", + "Total players: 2 \n", "\n", - "Total players: 8 \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "Exchanging game information.\n", - "Exchanging game information.Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", + "Waiting for other players: .. [ 2/ 2]\n", + "Total players: 2 \n", "\n", - "Total players: 8 \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", + "Waiting for other players: .. [ 2/ 2]\n", "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,624][39734] Initializing env for player 1, init_info: {'port': 41003}...\u001b[0m\n", - "\n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", + "Total players: 2 \n", "\n", - "Exchanging game information.Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: ... [ 3/ 8]\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 3 \n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI2 (node 1, player 2) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI1 (node 2, player 3) \n", - "Found AI3 (node 4, player 5) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,674][39734] Initializing env for player 2, init_info: {'port': 41003}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 6 \n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Console player number: 4 8]\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", "\n", "Go \n", - "Total players: 8 \n", - "Waiting for other players: .. [ 2/ 8]\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI2 (node 0, player 2) \n", - "Found AI1 (node 2, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Received All Here, sending ACK. \n", - "Found AI7 (node 6, player 7) \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI7 (node 0, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 0, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 0, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", + "Total players: 2 \n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", "\n", "Exchanging game information.\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:02:00,727][39734] Initializing env for player 3, init_info: {'port': 41003}...\u001b[0m\n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 0, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "\n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "\n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI7 (node 7, player 7) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,775][39734] Initializing env for player 4, init_info: {'port': 41003}...\u001b[0m\n", - "Found AI6 (node 0, player 8) \n", + "Go \n", + "Total players: 2 \n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", + "Total players: 2 \n", "\n", "Exchanging game information.\n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI2 (node 2, player 3) \n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 0, player 4) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI7 (node 0, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 7, player 8) \n", - "Total players: 8 \n", + "Go \n", + "Total players: 2 \n", "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Found AI0_host (node 1, player 1) \n", + "Exchanging game information.\n", + "Go \n", + "Total players: 2 \n", "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Found AI3 (node 4, player 4) \n", - "\u001b[36m[2023-09-12 21:02:00,838][39696] Port 40503 is available\u001b[0m\n", - "Found AI4 (node 5, player 5) \n", - "\u001b[36m[2023-09-12 21:02:00,838][39696] Using port 40503\u001b[0m\n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 7, player 7) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,838][39696] Initializing env for player 0, init_info: {'port': 40503}...\u001b[0m\n", - "Found AI6 (node 0, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 0, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Console player number: 3 8]\n", + "\n", + "Exchanging game information.\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Total players: 8 \n", + "Received \"Go.\" \n", "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,847][39734] Initializing env for player 5, init_info: {'port': 41003}...\u001b[0m\n", - "Total players: 8 \n", + "Total players: 2 \n", "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", + "Console player number: 1 \n", + "Received All Here, sending ACK. \n", + "Received \"Go.\" \n", "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Console player number: 4 8]\n", + "Total players: 2 \n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Total players: 8 \n", + "Received \"Go.\" \n", "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,867][39696] Using port 40503 on host...\u001b[0m\n", - "Total players: 8 \n", + "Total players: 2 \n", + "Found AI1 (node 1, player 2) \n", "\n", - "Waiting for other players: ........ [ 8/ 8]\n", + "Exchanging game information.\n", + "Exchanging game information.\n", + "Go \n", + "Total players: 2 \n", "\n", + "Go \n", + "Total players: 2 \n", "\n", "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,889][39696] Initializing env for player 1, init_info: {'port': 40503}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,891][39734] Initializing env for player 6, init_info: {'port': 41003}...\u001b[0m\n", + "Received \"Go.\" \n", "\n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 2 8]\n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI4 (node 4, player 5) \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", + "Total players: 2 \n", "\n", - "Console player number: 6 8]\n", + "Exchanging game information.\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", + "Received \"Go.\" \n", "\n", + "Total players: 2 \n", "\n", + "Found AI0_host (node 1, player 1) \n", + "Found AI1 (node 0, player 2) \n", + "Found AI0_host (node 1, player 1) \n", "\n", + "Found AI0_host (node 1, player 1) \n", + "Found AI0_host (node 1, player 1) \n", + "Found AI0_host (node 1, player 1) \n", + "Found AI1 (node 1, player 2) \n", + "Found AI0_host (node 1, player 1) \n", + "Found AI1 (node 1, player 2) \n", + "Found AI1 (node 0, player 2) \n", "\n", + "Found AI1 (node 1, player 2) \n", + "Found AI1 (node 1, player 2) \n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,052][75253] Initialized w:6 v:1 player:0\u001b[0m\n", + "Found AI1 (node 0, player 2) \n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,053][75253] Initialized w:6 v:1 player:1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,054][75253] 2 agent workers initialized for env 6!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,064][75253] Decorrelating experience for 32 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,067][75217] Initializing env for player 0, init_info: {'port': 40501}...\u001b[0m\n", + "Found AI1 (node 0, player 2) \n", + "Found AI1 (node 0, player 2) \n", + "Found AI1 (node 1, player 2) \n", + "Found AI1 (node 1, player 2) \n", + "Found AI1 (node 0, player 2) \n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,103][75217] Using port 40501 on host...\u001b[0m\n", "\n", - "\u001b[36m[2023-09-12 21:02:00,925][39731] Port 40703 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:00,925][39731] Using port 40703\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,926][39731] Initializing env for player 0, init_info: {'port': 40703}...\u001b[0m\n", + "Found AI1 (node 0, player 2) \n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,118][75217] Initializing env for player 1, init_info: {'port': 40501}...\u001b[0m\n", + "\n", + "\n", + "\u001b[36m[2023-09-14 12:37:13,135][75253] Multi agent env, num agents: 2\u001b[0m\n", + "\n", + "\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,144][75254] Initialized w:7 v:1 player:1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,144][75254] Initialized w:7 v:1 player:0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,146][75254] 2 agent workers initialized for env 7!\u001b[0m\n", + "\n", + "\u001b[36m[2023-09-14 12:37:13,164][75253] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,167][75215] Initialized w:1 v:1 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,168][75215] Initialized w:1 v:1 player:1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,169][75254] Decorrelating experience for 32 frames...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,169][75215] 2 agent workers initialized for env 1!\u001b[0m\n", + "\n", + "\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,179][75215] Decorrelating experience for 32 frames...\u001b[0m\n", + "\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,188][75218] Initialized w:3 v:1 player:1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,189][75218] Initialized w:3 v:1 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,189][75216] Initialized w:0 v:1 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,190][75216] Initialized w:0 v:1 player:1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,190][75218] 2 agent workers initialized for env 3!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,191][75216] 2 agent workers initialized for env 0!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,194][75253] Port 40902 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,194][75253] Using port 40902\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,194][75253] Initializing env for player 0, init_info: {'port': 40902}...\u001b[0m\n", + "\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,198][75216] Decorrelating experience for 32 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,200][75218] Decorrelating experience for 32 frames...\u001b[0m\n", + "\n", + "\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,217][75252] Initialized w:5 v:1 player:1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,218][75252] Initialized w:5 v:1 player:0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,219][75252] 2 agent workers initialized for env 5!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,227][75253] Using port 40902 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,228][75219] Initialized w:4 v:0 player:1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,228][75219] Initialized w:4 v:0 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,229][75252] Decorrelating experience for 32 frames...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,230][75219] 2 agent workers initialized for env 4!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,239][75219] Decorrelating experience for 0 frames...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,239][75219] Port 40701 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,240][75219] Using port 40701\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,240][75219] Initializing env for player 0, init_info: {'port': 40701}...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,241][75254] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,245][75253] Initializing env for player 1, init_info: {'port': 40902}...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,257][75215] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,266][75216] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,278][75218] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,279][75254] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,280][75219] Using port 40701 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,291][75219] Initializing env for player 1, init_info: {'port': 40701}...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,301][75216] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,303][75252] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,304][75215] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[33m[2023-09-14 12:37:13,327][75254] UDP port 41002 cannot be used [Errno 98] Address already in use\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,328][75254] Port 42002 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,328][75218] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,328][75254] Using port 42002\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,330][75216] Port 40302 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,330][75216] Using port 40302\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,331][75216] Initializing env for player 0, init_info: {'port': 40302}...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,350][75215] Port 40402 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,350][75252] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,350][75215] Using port 40402\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,350][75215] Initializing env for player 0, init_info: {'port': 40402}...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,357][75218] Port 40602 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,357][75218] Using port 40602\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,358][75218] Initializing env for player 0, init_info: {'port': 40602}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,359][75216] Using port 40302 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,381][75216] Initializing env for player 1, init_info: {'port': 40302}...\u001b[0m\n", + "Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Waiting for players: . [ 1/ 2]\u001b[37m\u001b[1m[2023-09-14 12:37:13,385][75215] Using port 40402 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,390][75218] Using port 40602 on host...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,395][75252] Port 40802 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:13,395][75252] Using port 40802\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,396][75252] Initializing env for player 0, init_info: {'port': 40802}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,401][75215] Initializing env for player 1, init_info: {'port': 40402}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,408][75218] Initializing env for player 1, init_info: {'port': 40602}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,441][75252] Using port 40802 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:13,449][75252] Initializing env for player 1, init_info: {'port': 40802}...\u001b[0m\n", + "Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Contacting host: /Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Total players: 2 \n", "\n", - "Found AI1 (node 0, player 2) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "\n", - "\n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI7 (node 7, player 7) \n", - "Found AI6 (node 0, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) 8]\n", - "Console player number: 2 8]\n", + "Waiting for other players: .. [ 2/ 2]\n", + "Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Contacting host: -Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "\n", + "Contacting host: -\n", "Go \n", - "Total players: 8 \n", + "Total players: 2 \n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", + "Done waiting.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Contacting host: /Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Total players: 2 \n", "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,943][39734] Initializing env for player 7, init_info: {'port': 41003}...\u001b[0m\n", - "Console player number: 3 8]\n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", + "Waiting for other players: .. [ 2/ 2]\n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Total players: 8 \n", - "Console player number: 4 8]\n", - "Received All Here, sending ACK. \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,949][39696] Initializing env for player 2, init_info: {'port': 40503}...\u001b[0m\n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Exchanging game information.\n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", - "Found AI3 (node 0, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:02:00,968][39733] Initialized w:6 v:3 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,969][39733] Initialized w:6 v:3 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,969][39733] Initialized w:6 v:3 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,970][39733] Initialized w:6 v:3 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,970][39733] Initialized w:6 v:3 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,971][39731] Using port 40703 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,971][39733] Initialized w:6 v:3 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,971][39733] Initialized w:6 v:3 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,972][39733] Initialized w:6 v:3 player:0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:00,973][39733] 8 agent workers initialized for env 6!\u001b[0m\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", + "Total players: 2 \n", + "Total players: 2 \n", + "\n", + "Waiting for other players: .. [ 2/ 2]\n", "Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:02:00,984][39731] Initializing env for player 1, init_info: {'port': 40703}...\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", + "Contacting host: /\n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", + "\n", + "Total players: 2 \n", "\n", - "Total players: 8 \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI7 (node 0, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,999][39696] Initializing env for player 3, init_info: {'port': 40503}...\u001b[0m\n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", + "Waiting for other players: .. [ 2/ 2]\n", "Console player number: 1 \n", "Received All Here, sending ACK. \n", + "Total players: 2 \n", + "\n", + "Waiting for other players: .. [ 2/ 2]\n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", + "\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", + "Contacting host: -\n", + "Go \n", + "Total players: 2 \n", + "Found AI0_host (node 1, player 1) \n", + "Total players: 2 \n", "\n", - "Total players: 8 \n", + "Waiting for other players: .. [ 2/ 2]\n", "\n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Go \n", - "Total players: 8 \n", + "Console player number: 1 \n", + "Received All Here, sending ACK. \n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", - "\n", + "Total players: 2 \n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", "\n", - "Total players: 8 \n", + "Exchanging game information.\n", + "Go \n", + "Total players: 2 \n", "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,016][39733] Decorrelating experience for 96 frames...\u001b[0m\n", + "Go \n", + "Total players: 2 \n", "\n", "Exchanging game information.\n", - "Exchanging game information.\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", - "\n", + "Total players: 2 \n", + "Total players: 2 \n", "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,031][39685] Initialized w:0 v:3 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,033][39685] Initialized w:0 v:3 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,034][39685] Initialized w:0 v:3 player:5\u001b[0m\n", + "Waiting for other players: .. [ 2/ 2]\n", "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,034][39685] Initialized w:0 v:3 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,035][39685] Initialized w:0 v:3 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,035][39685] Initialized w:0 v:3 player:0\u001b[0m\n", + "Found AI1 (node 1, player 2) \n", "\n", + "Go \n", + "Total players: 2 \n", + "Found AI1 (node 0, player 2) \n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,039][39685] Initialized w:0 v:3 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,042][39731] Initializing env for player 2, init_info: {'port': 40703}...\u001b[0m\n", "\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", + "Total players: 2 \n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", + "Total players: 2 \n", "\n", - "Total players: 8 \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,051][39696] Initializing env for player 4, init_info: {'port': 40503}...\u001b[0m\n", + "Found AI0_host (node 1, player 1) \n", "\n", "Exchanging game information.\n", - "Found AI0_host (node 1, player 1) \n", + "Go \n", + "Total players: 2 \n", "\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", + "Found AI0_host (node 1, player 1) \n", "\n", "\n", - "Found AI0_host (node 1, player 1) \n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", + "Total players: 2 \n", "\n", - "Found AI0_host (node 1, player 1) \n", + "Go \n", + "Total players: 2 \n", + "Found AI1 (node 1, player 2) \n", "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,095][39731] Initializing env for player 3, init_info: {'port': 40703}...\u001b[0m\n", + "Exchanging game information.\u001b[37m\u001b[1m[2023-09-14 12:37:14,216][75217] Initialized w:2 v:1 player:1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,217][75217] Initialized w:2 v:1 player:0\u001b[0m\n", "\n", + "Exchanging game information.\u001b[36m[2023-09-14 12:37:14,219][75217] 2 agent workers initialized for env 2!\u001b[0m\n", + "Found AI0_host (node 1, player 1) \n", + "Found AI1 (node 0, player 2) \n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,233][75217] Decorrelating experience for 32 frames...\u001b[0m\n", + "Found AI0_host (node 1, player 1) \n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,239][75254] Initializing env for player 0, init_info: {'port': 42002}...\u001b[0m\n", + "Found AI1 (node 1, player 2) \n", + "Found AI1 (node 1, player 2) \n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,279][75254] Using port 42002 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,289][75254] Initializing env for player 1, init_info: {'port': 42002}...\u001b[0m\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", + "Total players: 2 \n", + "Found AI1 (node 0, player 2) \n", "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,129][39696] Initializing env for player 5, init_info: {'port': 40503}...\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,153][39698] Initialized w:3 v:3 player:6\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,157][39698] Initialized w:3 v:3 player:4\u001b[0m\n", - "Found AI6 (node 3, player 4) \n", - "Found AI2 (node 4, player 5) \n", + "Exchanging game information.\u001b[36m[2023-09-14 12:37:14,302][75217] Multi agent env, num agents: 2\u001b[0m\n", "Found AI1 (node 1, player 2) \n", - "Found AI4 (node 2, player 3) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,159][39698] Initialized w:3 v:3 player:5\u001b[0m\n", - "Found AI3 (node 6, player 7) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,159][39698] Initialized w:3 v:3 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,159][39698] Initialized w:3 v:3 player:2\u001b[0m\n", - "Found AI5 (node 5, player 6) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,159][39698] Initialized w:3 v:3 player:0\u001b[0m\n", - "Found AI7 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,159][39698] Initialized w:3 v:3 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,160][39698] Initialized w:3 v:3 player:3\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:01,162][39698] 8 agent workers initialized for env 3!\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI6 (node 4, player 4) \n", - "Found AI2 (node 0, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,180][39731] Initializing env for player 4, init_info: {'port': 40703}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,183][39696] Initializing env for player 6, init_info: {'port': 40503}...\u001b[0m\n", + "\n", "Found AI0_host (node 1, player 1) \n", "Found AI1 (node 0, player 2) \n", - "Found AI4 (node 2, player 3) \n", - "Found AI6 (node 3, player 4) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI3 (node 2, player 3) work game synchronization.\n", - "Found AI2 (node 4, player 5) \n", - "Found AI6 (node 3, player 4) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "\n", - "Found AI5 (node 7, player 8) .\n", "\n", - "Found AI1 (node 1, player 2) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 0, player 3) \n", - "Found AI6 (node 3, player 4) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI6 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI3 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,233][39731] Initializing env for player 5, init_info: {'port': 40703}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,236][39698] Decorrelating experience for 96 frames...\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI6 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI3 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI6 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,251][39696] Initializing env for player 7, init_info: {'port': 40503}...\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 0, player 3) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI6 (node 3, player 4) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI6 (node 4, player 4) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI2 (node 0, player 5) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI6 (node 0, player 4) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI6 (node 0, player 4) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI6 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI4 (node 0, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI5 (node 7, player 8) \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI6 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI4 (node 6, player 6) \n", - "Found AI7 (node 0, player 7) \n", - "Found AI5 (node 7, player 8) \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI6 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI4 (node 6, player 6) \n", - "Found AI7 (node 7, player 7) \n", - "Found AI5 (node 0, player 8) \n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,303][39731] Initializing env for player 6, init_info: {'port': 40703}...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,334][75217] Multi agent env, num agents: 2\u001b[0m\n", "Found AI1 (node 0, player 2) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI6 (node 3, player 4) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI5 (node 7, player 8) \n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -s: . [ 1/ 8]\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,350][75253] Initialized w:6 v:2 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,351][75253] Initialized w:6 v:2 player:1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,353][75253] 2 agent workers initialized for env 6!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,363][75253] Decorrelating experience for 64 frames...\u001b[0m\n", "\n", + "\u001b[36m[2023-09-14 12:37:14,374][75217] Port 40502 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,374][75217] Using port 40502\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,374][75217] Initializing env for player 0, init_info: {'port': 40502}...\u001b[0m\n", "\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", + "Found AI1 (node 1, player 2) \n", "\n", + "Found AI0_host (node 1, player 1) \n", "\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,409][75217] Using port 40502 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,412][75216] Initialized w:0 v:2 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,413][75216] Initialized w:0 v:2 player:1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,414][75216] 2 agent workers initialized for env 0!\u001b[0m\n", + "Found AI1 (node 0, player 2) \n", + "Found AI1 (node 1, player 2) \n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,425][75217] Initializing env for player 1, init_info: {'port': 40502}...\u001b[0m\n", "\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,432][75216] Decorrelating experience for 64 frames...\u001b[0m\n", "\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,440][75219] Initialized w:4 v:1 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,441][75219] Initialized w:4 v:1 player:1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,443][75219] 2 agent workers initialized for env 4!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,452][75219] Decorrelating experience for 32 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,453][75218] Initialized w:3 v:2 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,453][75218] Initialized w:3 v:2 player:1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,455][75218] 2 agent workers initialized for env 3!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,467][75218] Decorrelating experience for 64 frames...\u001b[0m\n", "\n", + "Found AI1 (node 0, player 2) \n", + "\u001b[36m[2023-09-14 12:37:14,504][75253] Port 40903 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,504][75253] Using port 40903\u001b[0m\n", "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,369][39731] Initializing env for player 7, init_info: {'port': 40703}...\u001b[0m\n", "\n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Waiting for players: ... [ 3/ 8]\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,533][75215] Initialized w:1 v:2 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,534][75215] Initialized w:1 v:2 player:1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,535][75219] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,535][75215] 2 agent workers initialized for env 1!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,542][75215] Decorrelating experience for 64 frames...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,581][75219] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,600][75216] Port 40303 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,600][75216] Using port 40303\u001b[0m\n", + "\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,613][75252] Initialized w:5 v:2 player:1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,614][75252] Initialized w:5 v:2 player:0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,614][75252] 2 agent workers initialized for env 5!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,624][75252] Decorrelating experience for 64 frames...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,626][75219] Port 40702 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,626][75219] Using port 40702\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,627][75219] Initializing env for player 0, init_info: {'port': 40702}...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,628][75218] Port 40603 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,629][75218] Using port 40603\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,629][75218] Initializing env for player 0, init_info: {'port': 40603}...\u001b[0m\n", "Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:02:01,413][39697] Initialized w:1 v:3 player:3\u001b[0m\n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,415][39697] Initialized w:1 v:3 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,417][39697] Initialized w:1 v:3 player:0\u001b[0m\n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:02:01,417][39697] Initialized w:1 v:3 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,418][39697] Initialized w:1 v:3 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,420][39697] Initialized w:1 v:3 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,421][39697] Initialized w:1 v:3 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,422][39697] Initialized w:1 v:3 player:5\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "\u001b[36m[2023-09-12 21:02:01,423][39697] 8 agent workers initialized for env 1!\u001b[0m\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", + "Contacting host: /\u001b[37m\u001b[1m[2023-09-14 12:37:14,658][75219] Using port 40702 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,659][75218] Using port 40603 on host...\u001b[0m\n", + "Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:02:01,459][39699] Initialized w:5 v:3 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,461][39699] Initialized w:5 v:3 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,461][39699] Initialized w:5 v:3 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,462][39699] Initialized w:5 v:3 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,463][39699] Initialized w:5 v:3 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,466][39699] Initialized w:5 v:3 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,466][39699] Initialized w:5 v:3 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,466][39699] Initialized w:5 v:3 player:3\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:01,467][39699] 8 agent workers initialized for env 5!\u001b[0m\n", - "Got connect from node 3. \n", - "Waiting for players: .... [ 4/ 8]\u001b[37m\u001b[1m[2023-09-12 21:02:01,494][39697] Decorrelating experience for 96 frames...\u001b[0m\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", + "Waiting for players: . [ 1/ 2]\u001b[37m\u001b[1m[2023-09-14 12:37:14,679][75219] Initializing env for player 1, init_info: {'port': 40702}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,680][75218] Initializing env for player 1, init_info: {'port': 40603}...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,712][75215] Port 40403 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,712][75215] Using port 40403\u001b[0m\n", + "Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", + "Contacting host: -Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. 8]\n", - "Total players: 8 8]\n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,540][39699] Decorrelating experience for 96 frames...\u001b[0m\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", + "Done waiting.\u001b[36m[2023-09-14 12:37:14,781][75252] Port 40803 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:14,782][75252] Using port 40803\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,782][75252] Initializing env for player 0, init_info: {'port': 40803}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:14,810][75252] Using port 40803 on host...\u001b[0m\n", + "Waiting for players: . [ 1/ 2]\u001b[37m\u001b[1m[2023-09-14 12:37:14,832][75252] Initializing env for player 1, init_info: {'port': 40803}...\u001b[0m\n", + "Total players: 2 \n", "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: .... [ 4/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Total players: 8 \n", + "Waiting for other players: .. [ 2/ 2]\n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 8]\n", + "Console player number: 1 \n", + "Received All Here, sending ACK. \n", + "Total players: 2 \n", "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Got connect from node 1. 8]\n", - "Waiting for players: .. [ 2/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", + "Waiting for other players: .. [ 2/ 2]\n", "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", + "Go \n", + "Total players: 2 \n", + "\n", + "Exchanging game information.Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", "Contacting host: /Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Got connect from node 6. \n", - "Waiting for players: ....... [ 7/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", + "Waiting for players: . [ 1/ 2]Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", + "Console player number: 1 \n", + "Received All Here, sending ACK. \n", + "Received \"Go.\" \n", "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Got connect from node 2. 8]\n", - "Total players: 8 8]\n", + "Total players: 2 \n", + "Console player number: 1 \n", + "Received All Here, sending ACK. \n", "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Got connect from node 7. 8]\n", - "Waiting for players: ........ [ 8/ 8]\n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", "Sending all here. \n", "\n", - "Got connect from node 3. 8]\n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", + "Done waiting.Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Contacting host: /\n", + "Go \n", + "Total players: 2 \n", + "Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Contacting host: /\n", + "Console player number: 1 \n", + "Received All Here, sending ACK. \n", + "Received \"Go.\" \n", "\n", - "Waiting for other players: ........ [ 8/ 8]Press 'Q' to abort network game synchronization.\n", + "Total players: 2 \n", + "Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Got connect from node 2. 8]\n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Total players: 8 \n", + "Found AI0_host (node 1, player 1) \n", "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Total players: 8 8]\n", + "Found AI1 (node 1, player 2) \n", + "Total players: 2 \n", "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 \n", + "Waiting for other players: .. [ 2/ 2]\n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", + "Found AI1 (node 0, player 2) \n", + "Found AI0_host (node 1, player 1) \n", "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 \n", + "Console player number: 1 \n", + "Received All Here, sending ACK. \n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Total players: 8 \n", + "Done waiting.\n", + "Go \n", + "Total players: 2 \n", "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Total players: 8 \n", + "Total players: 2 \n", "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Total players: 8 \n", + "Waiting for other players: .. [ 2/ 2]\n", + "Total players: 2 \n", "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 \n", + "Waiting for other players: .. [ 2/ 2]\n", + "Found AI1 (node 1, player 2) \n", "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", + "Found AI1 (node 0, player 2) \n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,373][75254] Initialized w:7 v:2 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,374][75254] Initialized w:7 v:2 player:1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:15,375][75254] 2 agent workers initialized for env 7!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,385][75254] Decorrelating experience for 64 frames...\u001b[0m\n", "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,032][39685] Initialized w:0 v:3 player:2\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:02,033][39685] 8 agent workers initialized for env 0!\u001b[0m\n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Got connect from node 5. \n", - "Console player number: 3 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 7 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 4 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 5 8]\n", + "Received \"Go.\" \n", + "\n", + "Total players: 2 \n", + "\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Console player number: 6 ..... [ 8/ 8]\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,414][75216] Initializing env for player 0, init_info: {'port': 40303}...\u001b[0m\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ...... [ 6/ 8]\n", + "\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,443][75216] Using port 40303 on host...\u001b[0m\n", + "\n", "Go \n", - "Total players: 8 \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", + "Total players: 2 \n", + "\n", + "\n", + "Exchanging game information.\u001b[37m\u001b[1m[2023-09-14 12:37:15,465][75216] Initializing env for player 1, init_info: {'port': 40303}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,474][75217] Initialized w:2 v:2 player:1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,475][75217] Initialized w:2 v:2 player:0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:15,477][75217] 2 agent workers initialized for env 2!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,492][75217] Decorrelating experience for 64 frames...\u001b[0m\n", + "Found AI0_host (node 1, player 1) \n", "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:02:02,105][39685] Decorrelating experience for 96 frames...\u001b[0m\n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", + "Go \n", + "Total players: 2 \n", "\n", - "Total players: 8 \n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", + "Total players: 2 \n", + "Found AI1 (node 1, player 2) \n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,515][75253] Initializing env for player 0, init_info: {'port': 40903}...\u001b[0m\n", + "\n", + "Exchanging game information.\u001b[36m[2023-09-14 12:37:15,529][75254] Port 41003 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:15,529][75254] Using port 41003\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,529][75254] Initializing env for player 0, init_info: {'port': 41003}...\u001b[0m\n", "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", + "Total players: 2 \n", "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", + "Exchanging game information.\u001b[37m\u001b[1m[2023-09-14 12:37:15,548][75253] Using port 40903 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,565][75253] Initializing env for player 1, init_info: {'port': 40903}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,567][75254] Using port 41003 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,580][75254] Initializing env for player 1, init_info: {'port': 41003}...\u001b[0m\n", + "Found AI1 (node 0, player 2) \n", "\n", - "Total players: 8 \n", + "Found AI0_host (node 1, player 1) \n", + "\u001b[36m[2023-09-14 12:37:15,636][75217] Port 40503 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:15,636][75217] Using port 40503\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,636][75217] Initializing env for player 0, init_info: {'port': 40503}...\u001b[0m\n", + "Found AI0_host (node 1, player 1) \n", + "Found AI1 (node 1, player 2) \n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,665][75217] Using port 40503 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,687][75217] Initializing env for player 1, init_info: {'port': 40503}...\u001b[0m\n", "\n", - "Go \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", + "Found AI1 (node 1, player 2) \n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,710][75218] Initialized w:3 v:3 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,711][75218] Initialized w:3 v:3 player:1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:15,712][75218] 2 agent workers initialized for env 3!\u001b[0m\n", + "Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Found AI1 (node 0, player 2) \n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,722][75218] Decorrelating experience for 96 frames...\u001b[0m\n", + "Found AI1 (node 0, player 2) \n", "\n", - "Total players: 8 \n", + "Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Contacting host: /\n", + "Waiting for players: . [ 1/ 2]\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,837][75219] Initialized w:4 v:2 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,837][75219] Initialized w:4 v:2 player:1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:15,839][75219] 2 agent workers initialized for env 4!\u001b[0m\n", "\n", - "Total players: 8 \n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,849][75219] Decorrelating experience for 64 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,855][75252] Initialized w:5 v:3 player:1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,856][75252] Initialized w:5 v:3 player:0\u001b[0m\n", + "Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Waiting for players: . [ 1/ 2]\u001b[36m[2023-09-14 12:37:15,857][75252] 2 agent workers initialized for env 5!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,866][75252] Decorrelating experience for 96 frames...\u001b[0m\n", + "Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Contacting host: -\u001b[37m\u001b[1m[2023-09-14 12:37:15,873][75215] Initializing env for player 0, init_info: {'port': 40403}...\u001b[0m\n", + "Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", + "Done waiting.\u001b[37m\u001b[1m[2023-09-14 12:37:15,918][75215] Using port 40403 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,926][75215] Initializing env for player 1, init_info: {'port': 40403}...\u001b[0m\n", + "Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Total players: 2 \n", "\n", - "Total players: 8 \n", - "Total players: 8 \n", + "Waiting for other players: .. [ 2/ 2]\n", + "Press 'Q' to abort network game synchronization.\u001b[36m[2023-09-14 12:37:15,983][75219] Port 40703 is available\u001b[0m\n", "\n", - "Waiting for other players: ...... [ 6/ 8]\n", + "Network game synchronization timeout: 4s.\n", + "Contacting host: /\u001b[36m[2023-09-14 12:37:15,983][75219] Using port 40703\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:15,983][75219] Initializing env for player 0, init_info: {'port': 40703}...\u001b[0m\n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", + "Done waiting.Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Waiting for players: . [ 1/ 2]\u001b[37m\u001b[1m[2023-09-14 12:37:16,013][75219] Using port 40703 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:16,034][75219] Initializing env for player 1, init_info: {'port': 40703}...\u001b[0m\n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Total players: 8 \n", + "Total players: 2 \n", "\n", - "Got connect from node 6. \n", + "Waiting for other players: .. [ 2/ 2]\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Total players: 8 \n", + "Done waiting.\n", + "Go \n", + "Total players: 2 \n", "\n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", + "Total players: 2 \n", "\n", - "Total players: 8 \n", + "Waiting for other players: .. [ 2/ 2]\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", + "Total players: 2 \n", "\n", - "Total players: 8 \n", - "Contacting host: -\n", - "Exchanging game information.\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", + "Total players: 2 \n", "\n", - "Total players: 8 \n", + "Waiting for other players: .. [ 2/ 2]\n", "\n", - "Total players: 8 8]\n", + "Go \n", + "Total players: 2 \n", + "Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Waiting for players: . [ 1/ 2]\n", + "Console player number: 1 \n", + "Received All Here, sending ACK. \n", + "\n", + "Go \n", + "Total players: 2 \n", "\n", - "Waiting for other players: ....... [ 7/ 8]\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", + "Total players: 2 \n", "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", "\n", - "Found AI0_host (node 1, player 1) \n", - "Total players: 8 8]\n", + "Console player number: 1 \n", + "Received All Here, sending ACK. \n", "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) 8]\n", - "Found AI2 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI6 (node 6, player 6) \n", - "Found AI5 (node 0, player 7) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 0, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI6 (node 0, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI4 (node 7, player 8) \n", + "Go \n", + "Total players: 2 \n", + "Waiting for players: . [ 1/ 2]\n", "Found AI1 (node 1, player 2) \n", - "Found AI1 (node 2, player 2) 8]\n", - "Found AI2 (node 3, player 3) \n", - "Found AI4 (node 0, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI4 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 0, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI4 (node 7, player 8) \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI6 (node 6, player 6) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI5 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI6 (node 0, player 5) \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI4 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI6 (node 5, player 5) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI7 (node 0, player 6) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 5, player 5) \n", - "Found AI4 (node 7, player 8) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 0, player 7) \n", - "Found AI4 (node 7, player 8) \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI6 (node 5, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 7, player 7) \n", - "Found AI4 (node 0, player 8) \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "\n", + "Received \"Go.\" \n", "\n", + "Total players: 2 \n", + "Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Contacting host: /\n", + "Exchanging game information.Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Contacting host: /Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", "Found AI1 (node 0, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI4 (node 7, player 8) \n", - "\n", + "Found AI0_host (node 1, player 1) \n", + "Console player number: 1 \n", + "Received All Here, sending ACK. \n", + "Received \"Go.\" \n", "\n", + "Total players: 2 \n", "\n", + "Found AI1 (node 1, player 2) \n", "\n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", + "Found AI0_host (node 1, player 1) \n", + "Found AI1 (node 1, player 2) \n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", + "Done waiting.\n", + "Found AI1 (node 0, player 2) \n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:16,489][75216] Initialized w:0 v:3 player:1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:16,489][75216] Initialized w:0 v:3 player:0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:16,490][75216] 2 agent workers initialized for env 0!\u001b[0m\n", + "Found AI0_host (node 1, player 1) \n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:16,498][75216] Decorrelating experience for 96 frames...\u001b[0m\n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", "\n", - "Go \n", - "Total players: 8 \n", + "Done waiting.\n", + "Found AI1 (node 1, player 2) \n", + "Found AI1 (node 0, player 2) \n", + "Total players: 2 \n", "\n", + "Waiting for other players: .. [ 2/ 2]\n", "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", + "Total players: 2 \n", "\n", - "Total players: 8 \n", + "Waiting for other players: .. [ 2/ 2]\n", "\n", + "Found AI1 (node 0, player 2) \n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:16,597][75253] Initialized w:6 v:3 player:1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:16,599][75253] Initialized w:6 v:3 player:0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:16,600][75253] 2 agent workers initialized for env 6!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:16,614][75253] Decorrelating experience for 96 frames...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:16,619][109198] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 6832128. Throughput: 0: 0.0, 1: 42.0. Samples: 210. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", "\n", - "Total players: 8 \n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:16,671][75254] Initialized w:7 v:3 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:16,672][75254] Initialized w:7 v:3 player:1\u001b[0m\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", + "\u001b[36m[2023-09-14 12:37:16,673][75254] 2 agent workers initialized for env 7!\u001b[0m\n", "\n", - "Total players: 8 \n", + "Go \n", + "Total players: 2 \n", "\n", + "Exchanging game information.\u001b[37m\u001b[1m[2023-09-14 12:37:16,683][75254] Decorrelating experience for 96 frames...\u001b[0m\n", "\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:16,710][75217] Initialized w:2 v:3 player:1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:16,711][75217] Initialized w:2 v:3 player:0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:16,712][75217] 2 agent workers initialized for env 2!\u001b[0m\n", "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Exchanging game information.\n", + "Go \n", + "Total players: 2 \n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:16,721][75217] Decorrelating experience for 96 frames...\u001b[0m\n", "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,510][39734] Initialized w:7 v:3 player:2\u001b[0m\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", + "Total players: 2 \n", "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,511][39734] Initialized w:7 v:3 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,512][39734] Initialized w:7 v:3 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,512][39734] Initialized w:7 v:3 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,512][39734] Initialized w:7 v:3 player:1\u001b[0m\n", + "Console player number: 1 \n", "Received All Here, sending ACK. \n", "Received \"Go.\" \n", "\n", - "Total players: 8 \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,513][39734] Initialized w:7 v:3 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,513][39734] Initialized w:7 v:3 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,514][39734] Initialized w:7 v:3 player:6\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:02,515][39734] 8 agent workers initialized for env 7!\u001b[0m\n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", + "Total players: 2 \n", "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:02:02,555][39734] Decorrelating experience for 96 frames...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,559][39696] Initialized w:2 v:3 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,560][39696] Initialized w:2 v:3 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,560][39696] Initialized w:2 v:3 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,560][39696] Initialized w:2 v:3 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,560][39696] Initialized w:2 v:3 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,561][39696] Initialized w:2 v:3 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,561][39696] Initialized w:2 v:3 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,561][39696] Initialized w:2 v:3 player:7\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:02,563][39696] 8 agent workers initialized for env 2!\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,612][39696] Decorrelating experience for 96 frames...\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", "Found AI0_host (node 1, player 1) \n", "Found AI0_host (node 1, player 1) \n", "Found AI1 (node 1, player 2) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 5, player 6) \n", + "Found AI1 (node 1, player 2) \n", "Found AI1 (node 0, player 2) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 0, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 7, player 7) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI6 (node 0, player 8) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 0, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 0, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI7 (node 0, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,881][39731] Initialized w:4 v:3 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,883][39731] Initialized w:4 v:3 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,883][39731] Initialized w:4 v:3 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,883][39731] Initialized w:4 v:3 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,883][39731] Initialized w:4 v:3 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,883][39731] Initialized w:4 v:3 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,884][39731] Initialized w:4 v:3 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,884][39731] Initialized w:4 v:3 player:0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:02,887][39731] 8 agent workers initialized for env 4!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,948][39731] Decorrelating experience for 96 frames...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:03,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:05,178][39537] Signal inference workers to stop experience collection...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:05,203][39686] InferenceWorker_p0-w0: stopping experience collection\u001b[0m\n", + "Found AI1 (node 0, player 2) \n", + "\n", + "\n", + "\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:17,079][75219] Initialized w:4 v:3 player:1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:17,080][75219] Initialized w:4 v:3 player:0\u001b[0m\n", + "\n", + "\u001b[36m[2023-09-14 12:37:17,082][75219] 2 agent workers initialized for env 4!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:17,092][75219] Decorrelating experience for 96 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:17,098][75215] Initialized w:1 v:3 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:17,099][75215] Initialized w:1 v:3 player:1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:17,100][75215] 2 agent workers initialized for env 1!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:17,111][75215] Decorrelating experience for 96 frames...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:18,407][74942] Signal inference workers to stop experience collection...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:18,414][75209] InferenceWorker_p1-w0: stopping experience collection\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:18,418][75214] InferenceWorker_p0-w0: stopping experience collection\u001b[0m\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/torch/nn/modules/module.py:1501: UserWarning: operator() profile_node %43 : int[] = prim::profile_ivalue(%axis.1)\n", + " does not have profile information (Triggered internally at ../third_party/nvfuser/csrc/graph_fuser.cpp:104.)\n", + " return forward_call(*args, **kwargs)\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/torch/nn/modules/module.py:1501: UserWarning: operator() profile_node %43 : int[] = prim::profile_ivalue(%axis.1)\n", " does not have profile information (Triggered internally at ../third_party/nvfuser/csrc/graph_fuser.cpp:104.)\n", " return forward_call(*args, **kwargs)\n", - "\u001b[31m\u001b[1m[2023-09-12 21:02:06,207][39537] EvtLoop [learner_proc0_evt_loop, process=learner_proc0] unhandled exception in slot='on_new_training_batch' connected to emitter=Emitter(object_id='Batcher_0', signal_name='training_batches_available'), args=(0,)\u001b[0m\n", - "Traceback (most recent call last):\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py\", line 355, in _process_signal\n", - " slot_callable(*args)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner_worker.py\", line 150, in on_new_training_batch\n", - " stats = self.learner.train(self.batcher.training_batches[batch_idx])\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py\", line 1046, in train\n", - " train_stats = self._train(buff, self.cfg.batch_size, experience_size, num_invalids)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py\", line 731, in _train\n", - " ) = self._calculate_losses(mb, num_invalids)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py\", line 649, in _calculate_losses\n", - " exploration_loss = self.exploration_loss_func(action_distribution, valids, num_invalids)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py\", line 477, in _symmetric_kl_exploration_loss\n", - " kl_prior = action_distribution.symmetric_kl_with_uniform_prior()\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py\", line 247, in symmetric_kl_with_uniform_prior\n", - " sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions]\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py\", line 247, in \n", - " sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions]\n", - "AttributeError: 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior'\n", - "\u001b[33m[2023-09-12 21:02:06,208][39537] Unhandled exception 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior' in evt loop learner_proc0_evt_loop\u001b[0m\n", - "Process learner_proc0:\n", - "Traceback (most recent call last):\n", - " File \"/home/cogstack/miniconda3/lib/python3.10/multiprocessing/process.py\", line 314, in _bootstrap\n", - " self.run()\n", - " File \"/home/cogstack/miniconda3/lib/python3.10/multiprocessing/process.py\", line 108, in run\n", - " self._target(*self._args, **self._kwargs)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py\", line 511, in _target\n", - " self.event_loop.exec()\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py\", line 403, in exec\n", - " raise exc\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py\", line 399, in exec\n", - " while self._loop_iteration():\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py\", line 383, in _loop_iteration\n", - " self._process_signal(s)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py\", line 358, in _process_signal\n", - " raise exc\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py\", line 355, in _process_signal\n", - " slot_callable(*args)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner_worker.py\", line 150, in on_new_training_batch\n", - " stats = self.learner.train(self.batcher.training_batches[batch_idx])\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py\", line 1046, in train\n", - " train_stats = self._train(buff, self.cfg.batch_size, experience_size, num_invalids)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py\", line 731, in _train\n", - " ) = self._calculate_losses(mb, num_invalids)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py\", line 649, in _calculate_losses\n", - " exploration_loss = self.exploration_loss_func(action_distribution, valids, num_invalids)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py\", line 477, in _symmetric_kl_exploration_loss\n", - " kl_prior = action_distribution.symmetric_kl_with_uniform_prior()\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py\", line 247, in symmetric_kl_with_uniform_prior\n", - " sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions]\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py\", line 247, in \n", - " sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions]\n", - "AttributeError: 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior'\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,931][28625] Heartbeat connected on Batcher_0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,938][28625] Heartbeat connected on InferenceWorker_p0-w0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,944][28625] Heartbeat connected on RolloutWorker_w0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,949][28625] Heartbeat connected on RolloutWorker_w1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,953][28625] Heartbeat connected on RolloutWorker_w2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,957][28625] Heartbeat connected on RolloutWorker_w3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,961][28625] Heartbeat connected on RolloutWorker_w4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,965][28625] Heartbeat connected on RolloutWorker_w5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,968][28625] Heartbeat connected on RolloutWorker_w6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,973][28625] Heartbeat connected on RolloutWorker_w7\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 483.2. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 362.4. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 289.9. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 241.6. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 207.1. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 181.2. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 161.1. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 161.1. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 161.1. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:33,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:48,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:03,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:08,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:28,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:23,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:28,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:43,670][28625] Components not started: LearnerWorker_p0, wait_time=600.0 seconds\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:38,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:08,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:48,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:53,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:58,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:03,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:08,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:23,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:28,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:13,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:18,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:33,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:08,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:33,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:43,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:43,670][28625] Components not started: LearnerWorker_p0, wait_time=1200.0 seconds\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:03,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:08,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:28,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:43,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:48,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:03,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:53,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:43,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:31:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:31:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:31:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:31:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:31:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:31:27,821][28625] Keyboard interrupt detected in the event loop EvtLoop [Runner_EvtLoop, process=main process 28625], exiting...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:31:27,823][28625] Runner profile tree view:\n", - "main_loop: 1780.8502\u001b[0m\n", - "\u001b[36m[2023-09-12 21:31:27,824][39537] Stopping Batcher_0...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:31:27,825][28625] Collected {0: 0}, FPS: 0.0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:31:27,825][39537] Loop batcher_evt_loop terminating...\u001b[0m\n" + "\u001b[36m[2023-09-14 12:37:21,400][74942] Signal inference workers to resume experience collection...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:21,401][75214] InferenceWorker_p0-w0: resuming experience collection\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:21,401][75209] InferenceWorker_p1-w0: resuming experience collection\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:21,619][109198] Fps is (10 sec: 409.6, 60 sec: 409.6, 300 sec: 409.6). Total num frames: 6836224. Throughput: 0: 276.8, 1: 204.4. Samples: 4812. Policy #0 lag: (min: 0.0, avg: 0.0, max: 0.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:23,290][75052] Signal inference workers to stop experience collection...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:23,730][109198] Heartbeat connected on Batcher_0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:23,734][109198] Heartbeat connected on LearnerWorker_p0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:23,739][109198] Heartbeat connected on Batcher_1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:23,748][109198] Heartbeat connected on InferenceWorker_p0-w0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:23,754][109198] Heartbeat connected on InferenceWorker_p1-w0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:23,760][109198] Heartbeat connected on RolloutWorker_w0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:23,764][109198] Heartbeat connected on RolloutWorker_w1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:23,768][75052] Signal inference workers to resume experience collection...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:23,768][109198] Heartbeat connected on RolloutWorker_w2\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:23,772][109198] Heartbeat connected on RolloutWorker_w3\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:23,777][109198] Heartbeat connected on RolloutWorker_w4\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:23,781][109198] Heartbeat connected on RolloutWorker_w5\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:23,806][109198] Heartbeat connected on RolloutWorker_w6\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:23,815][109198] Heartbeat connected on RolloutWorker_w7\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:24,239][109198] Heartbeat connected on LearnerWorker_p1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:26,619][109198] Fps is (10 sec: 6144.1, 60 sec: 4096.0, 300 sec: 4096.0). Total num frames: 6893568. Throughput: 0: 562.1, 1: 390.4. Samples: 14288. Policy #0 lag: (min: 0.0, avg: 1.1, max: 3.0)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:27,219][75214] Updated weights for policy 0, policy_version 1197 (0.0697)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:29,320][75209] Updated weights for policy 1, policy_version 491 (0.0018)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:31,619][109198] Fps is (10 sec: 12288.3, 60 sec: 6348.8, 300 sec: 6348.8). Total num frames: 6959104. Throughput: 0: 690.6, 1: 697.4. Samples: 27760. Policy #0 lag: (min: 0.0, avg: 0.9, max: 2.0)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:32,425][75214] Updated weights for policy 0, policy_version 1207 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:36,248][75209] Updated weights for policy 1, policy_version 501 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:36,619][109198] Fps is (10 sec: 13516.9, 60 sec: 7864.3, 300 sec: 7864.3). Total num frames: 7028736. Throughput: 0: 1047.8, 1: 743.8. Samples: 44789. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:37,225][75214] Updated weights for policy 0, policy_version 1217 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:41,619][109198] Fps is (10 sec: 14745.6, 60 sec: 9147.8, 300 sec: 9147.8). Total num frames: 7106560. Throughput: 0: 1297.6, 1: 918.7. Samples: 66489. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:42,111][75214] Updated weights for policy 0, policy_version 1227 (0.0013)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:42,915][75209] Updated weights for policy 1, policy_version 511 (0.0013)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:46,619][109198] Fps is (10 sec: 14745.6, 60 sec: 9830.4, 300 sec: 9830.4). Total num frames: 7176192. Throughput: 0: 1298.3, 1: 1051.7. Samples: 82250. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:46,871][75214] Updated weights for policy 0, policy_version 1237 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:49,876][75209] Updated weights for policy 1, policy_version 521 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:51,619][109198] Fps is (10 sec: 13926.2, 60 sec: 10342.4, 300 sec: 10342.4). Total num frames: 7245824. Throughput: 0: 1439.7, 1: 1022.9. Samples: 98505. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:51,894][75214] Updated weights for policy 0, policy_version 1247 (0.0015)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:54,390][75253] DAMAGECOUNT value on done: 85.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:54,391][75253] DAMAGECOUNT value on done: 105.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:54,392][75253] Sum rewards: 5.616, reward structure: {'HEALTH': '-0.850', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.024', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.196', 'WEAPON3': '0.200', 'weapon2': '0.362', 'weapon3': '0.968', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon5': '2.436'}\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:54,701][75253] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:55,030][75253] DAMAGECOUNT value on done: 320.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:55,030][75253] DAMAGECOUNT value on done: 355.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:55,031][75253] Sum rewards: 5.033, reward structure: {'HEALTH': '-3.400', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.025', 'weapon5': '0.038', 'AMMO3': '0.103', 'weapon2': '0.110', 'AMMO4': '0.123', 'WEAPON4': '0.200', 'WEAPON5': '0.400', 'weapon4': '0.618', 'WEAPON3': '0.800', 'weapon3': '2.796', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.200'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:55,031][75253] Sum rewards: 5.421, reward structure: {'HEALTH': '-3.150', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.013', 'AMMO5': '0.015', 'AMMO4': '0.066', 'AMMO3': '0.066', 'weapon2': '0.152', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon4': '0.344', 'WEAPON3': '0.600', 'weapon5': '0.604', 'weapon3': '2.560', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.550'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:56,044][75215] DAMAGECOUNT value on done: 36.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:56,044][75215] DAMAGECOUNT value on done: 0.0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:56,229][75215] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:56,475][75209] Updated weights for policy 1, policy_version 531 (0.0013)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:56,619][109198] Fps is (10 sec: 14335.9, 60 sec: 10831.7, 300 sec: 10831.7). Total num frames: 7319552. Throughput: 0: 1559.4, 1: 1115.8. Samples: 120388. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:56,620][109198] Avg episode reward: [(0, '4.320')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:56,621][74942] Saving new best policy, reward=4.320!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:56,637][75215] DAMAGECOUNT value on done: 230.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:56,637][75215] DAMAGECOUNT value on done: 215.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:56,638][75215] Sum rewards: 6.437, reward structure: {'HEALTH': '-1.500', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.008', 'AMMO5': '0.010', 'AMMO3': '0.039', 'AMMO4': '0.041', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.836', 'weapon5': '0.990', 'FRAGCOUNT': '2.000', 'weapon3': '2.112', 'DAMAGECOUNT': '2.300'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:56,638][75215] Sum rewards: 2.275, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'AMMO4': '-0.003', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.017', 'weapon4': '0.038', 'WEAPON4': '0.100', 'AMMO3': '0.108', 'WEAPON5': '0.400', 'weapon5': '0.444', 'weapon2': '0.748', 'WEAPON3': '0.800', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '2.150', 'weapon3': '2.474'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:56,750][75218] DAMAGECOUNT value on done: 65.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:56,750][75218] DAMAGECOUNT value on done: 0.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:56,926][75214] Updated weights for policy 0, policy_version 1257 (0.0013)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:56,937][75218] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:57,274][75218] DAMAGECOUNT value on done: 100.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:57,275][75218] DAMAGECOUNT value on done: 45.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:57,275][75218] Sum rewards: 4.505, reward structure: {'HEALTH': '-0.450', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.020', 'AMMO4': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.270', 'weapon4': '0.576', 'weapon3': '0.668', 'weapon5': '0.896', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:57,276][75218] Sum rewards: 0.874, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO5': '0.005', 'AMMO4': '0.008', 'AMMO3': '0.070', 'weapon5': '0.098', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.450', 'weapon2': '0.454', 'weapon4': '0.552', 'WEAPON3': '0.600', 'weapon3': '2.336'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:57,703][75217] DAMAGECOUNT value on done: 212.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:57,704][75217] DAMAGECOUNT value on done: 165.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:57,705][75217] Sum rewards: 5.886, reward structure: {'HEALTH': '-1.600', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.007', 'weapon2': '0.044', 'AMMO3': '0.048', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.482', 'weapon5': '1.488', 'weapon3': '1.496', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.120'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:57,705][75217] Sum rewards: 0.386, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.024', 'AMMO3': '0.047', 'weapon5': '0.054', 'AMMO4': '0.119', 'weapon2': '0.176', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'WEAPON3': '0.400', 'weapon4': '0.766', 'FRAGCOUNT': '0.999', 'weapon3': '1.640', 'DAMAGECOUNT': '1.650'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:57,801][75219] DAMAGECOUNT value on done: 205.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:57,801][75219] Sum rewards: 6.653, reward structure: {'HEALTH': '-0.100', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.370', 'FRAGCOUNT': '1.000', 'weapon3': '1.010', 'weapon5': '1.798', 'DAMAGECOUNT': '2.050'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:57,802][75219] DAMAGECOUNT value on done: 10.0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:57,877][75217] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:57,888][75218] DAMAGECOUNT value on done: 168.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:57,888][75218] DAMAGECOUNT value on done: 215.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:57,889][75218] Sum rewards: 2.902, reward structure: {'HEALTH': '-2.050', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'weapon5': '0.008', 'AMMO2': '0.015', 'weapon2': '0.050', 'AMMO3': '0.059', 'AMMO4': '0.076', 'WEAPON5': '0.100', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'weapon4': '0.978', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.680', 'weapon3': '2.180'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:57,889][75218] Sum rewards: 4.623, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.011', 'AMMO4': '0.053', 'AMMO3': '0.058', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon5': '0.336', 'weapon4': '0.412', 'WEAPON3': '0.500', 'weapon2': '0.658', 'FRAGCOUNT': '1.999', 'weapon3': '2.036', 'DAMAGECOUNT': '2.150'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,240][75217] DAMAGECOUNT value on done: 32.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,240][75217] DAMAGECOUNT value on done: 10.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,387][75219] DAMAGECOUNT value on done: 60.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,387][75219] DAMAGECOUNT value on done: 213.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,388][75219] Sum rewards: 6.148, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.040', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.224', 'WEAPON3': '0.400', 'weapon4': '0.450', 'weapon5': '0.470', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.130', 'weapon3': '2.226'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,419][75253] DAMAGECOUNT value on done: 130.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,420][75253] DAMAGECOUNT value on done: 95.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,420][75253] Sum rewards: 1.805, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.002', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.049', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.462', 'weapon4': '0.508', 'weapon2': '0.598', 'DAMAGECOUNT': '1.300', 'weapon3': '2.032'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,421][75253] Sum rewards: 2.915, reward structure: {'HEALTH': '-1.550', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.320', 'weapon2': '0.388', 'WEAPON3': '0.400', 'weapon5': '0.872', 'DAMAGECOUNT': '0.950', 'weapon3': '2.188'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,475][75218] DAMAGECOUNT value on done: 30.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,475][75218] DAMAGECOUNT value on done: 100.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,476][75218] Sum rewards: 5.986, reward structure: {'HEALTH': '-0.300', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'weapon2': '0.046', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.224', 'weapon3': '0.982', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon5': '2.610'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,504][75252] DAMAGECOUNT value on done: 173.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,505][75252] Sum rewards: 3.111, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.027', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.033', 'weapon5': '0.064', 'WEAPON5': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.430', 'FRAGCOUNT': '1.000', 'weapon3': '1.378', 'DAMAGECOUNT': '1.730'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,505][75252] DAMAGECOUNT value on done: 105.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,505][75252] Sum rewards: 2.757, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.018', 'AMMO3': '0.081', 'AMMO4': '0.087', 'WEAPON5': '0.200', 'weapon5': '0.298', 'WEAPON4': '0.300', 'weapon2': '0.304', 'WEAPON3': '0.600', 'weapon4': '0.952', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '1.858'}\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:58,594][75219] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:58,743][75252] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,841][75217] DAMAGECOUNT value on done: 121.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,843][75217] Sum rewards: 4.644, reward structure: {'HEALTH': '-0.950', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.024', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon2': '0.152', 'WEAPON3': '0.200', 'weapon4': '0.262', 'weapon3': '0.854', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.210', 'weapon5': '1.664'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,844][75217] DAMAGECOUNT value on done: 95.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,929][75219] DAMAGECOUNT value on done: 55.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,930][75219] DAMAGECOUNT value on done: 295.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:58,931][75219] Sum rewards: 7.326, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO4': '0.050', 'AMMO3': '0.052', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.512', 'weapon4': '0.522', 'weapon5': '1.090', 'weapon3': '1.436', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.950'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:59,093][75253] DAMAGECOUNT value on done: 12.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:59,093][75253] DAMAGECOUNT value on done: 30.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:59,094][75253] Sum rewards: 1.796, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.005', 'AMMO4': '0.024', 'AMMO3': '0.051', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.120', 'weapon4': '0.248', 'weapon2': '0.290', 'WEAPON3': '0.400', 'weapon5': '1.024', 'weapon3': '1.432'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:59,103][75252] DAMAGECOUNT value on done: 10.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:59,103][75252] DAMAGECOUNT value on done: 12.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:59,237][75216] DAMAGECOUNT value on done: 0.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:59,238][75216] DAMAGECOUNT value on done: 110.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:59,239][75216] Sum rewards: 6.223, reward structure: {'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.015', 'weapon2': '0.016', 'AMMO3': '0.020', 'AMMO4': '0.074', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.532', 'weapon3': '0.862', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon5': '2.200'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:59,493][75217] DAMAGECOUNT value on done: 30.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:59,493][75217] DAMAGECOUNT value on done: 0.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:59,519][75219] DAMAGECOUNT value on done: 0.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:59,520][75219] DAMAGECOUNT value on done: 30.0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:37:59,521][75216] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:59,890][75252] DAMAGECOUNT value on done: 0.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:59,891][75252] DAMAGECOUNT value on done: 15.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:59,891][75252] Sum rewards: 1.939, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.004', 'AMMO2': '0.010', 'AMMO3': '0.049', 'AMMO4': '0.050', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon2': '0.216', 'WEAPON3': '0.400', 'weapon4': '0.596', 'weapon5': '0.980', 'weapon3': '1.334'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:59,935][75216] DAMAGECOUNT value on done: 208.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:59,936][75216] Sum rewards: 3.081, reward structure: {'HEALTH': '-2.600', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.011', 'AMMO5': '0.012', 'AMMO4': '0.056', 'AMMO3': '0.072', 'WEAPON4': '0.200', 'weapon4': '0.294', 'WEAPON5': '0.300', 'weapon5': '0.408', 'weapon2': '0.410', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '2.080', 'weapon3': '2.236'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:59,936][75216] DAMAGECOUNT value on done: 260.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:37:59,936][75216] Sum rewards: 6.828, reward structure: {'HEALTH': '-1.350', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.003', 'AMMO5': '0.010', 'AMMO4': '0.013', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.252', 'weapon2': '0.366', 'WEAPON3': '0.400', 'weapon5': '1.138', 'FRAGCOUNT': '2.000', 'weapon3': '2.056', 'DAMAGECOUNT': '2.600'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:00,236][75215] DAMAGECOUNT value on done: 105.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:00,237][75215] DAMAGECOUNT value on done: 65.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:00,237][75215] Sum rewards: 5.756, reward structure: {'HEALTH': '-0.650', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.019', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.344', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '1.092', 'weapon5': '2.626'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:00,238][75215] Sum rewards: -0.390, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.007', 'AMMO4': '0.034', 'AMMO3': '0.048', 'WEAPON5': '0.100', 'weapon4': '0.146', 'weapon5': '0.158', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.518', 'DAMAGECOUNT': '0.650', 'weapon3': '1.346'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:00,489][75252] DAMAGECOUNT value on done: 0.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:00,489][75252] DAMAGECOUNT value on done: 64.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:00,579][75216] DAMAGECOUNT value on done: 5.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:00,579][75216] DAMAGECOUNT value on done: 50.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:00,610][75254] DAMAGECOUNT value on done: 115.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:00,610][75254] DAMAGECOUNT value on done: 0.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:00,611][75254] Sum rewards: 4.088, reward structure: {'HEALTH': '-0.250', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.010', 'AMMO3': '0.020', 'AMMO4': '0.049', 'weapon2': '0.070', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.198', 'WEAPON3': '0.200', 'weapon4': '0.452', 'weapon3': '0.986', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150'}\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:00,823][75254] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:00,857][75215] DAMAGECOUNT value on done: 35.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:00,857][75215] DAMAGECOUNT value on done: 0.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:00,858][75215] Sum rewards: 2.594, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.009', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.692', 'weapon5': '1.436', 'weapon3': '1.878'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:01,398][75254] DAMAGECOUNT value on done: 20.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:01,398][75254] DAMAGECOUNT value on done: 45.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:01,399][75254] Sum rewards: 1.904, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.010', 'AMMO4': '0.050', 'AMMO3': '0.053', 'WEAPON5': '0.100', 'weapon2': '0.158', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.450', 'weapon4': '0.608', 'weapon5': '0.774', 'weapon3': '1.098'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:01,430][75216] DAMAGECOUNT value on done: 130.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:01,431][75216] Sum rewards: 3.852, reward structure: {'HEALTH': '-0.450', 'HITCOUNT': '0.000', 'AMMO2': '0.010', 'AMMO3': '0.020', 'AMMO4': '0.050', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.306', 'weapon4': '0.394', 'weapon3': '0.922', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.300'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:01,430][75216] DAMAGECOUNT value on done: 45.0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:01,619][109198] Fps is (10 sec: 13926.4, 60 sec: 11059.2, 300 sec: 11059.2). Total num frames: 7385088. Throughput: 0: 1676.3, 1: 1333.4. Samples: 135650. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:01,620][109198] Avg episode reward: [(0, '3.747'), (1, '2.728')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:02,130][75254] DAMAGECOUNT value on done: 15.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:02,130][75254] DAMAGECOUNT value on done: 280.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:02,131][75254] Sum rewards: 7.995, reward structure: {'HEALTH': '-0.150', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'weapon4': '0.098', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.350', 'weapon3': '1.028', 'weapon5': '1.446', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.800'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:02,358][75209] Updated weights for policy 1, policy_version 541 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:02,754][75254] DAMAGECOUNT value on done: 205.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:02,754][75254] DAMAGECOUNT value on done: 155.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:02,755][75254] Sum rewards: 6.024, reward structure: {'HEALTH': '-1.550', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.328', 'weapon2': '0.360', 'WEAPON3': '0.400', 'weapon5': '1.140', 'weapon3': '1.948', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:02,755][75254] Sum rewards: 2.768, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO4': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.059', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.278', 'WEAPON3': '0.500', 'weapon2': '0.510', 'weapon4': '0.566', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.550', 'weapon3': '1.894'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:03,003][75214] Updated weights for policy 0, policy_version 1267 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:06,619][109198] Fps is (10 sec: 14336.0, 60 sec: 11468.8, 300 sec: 11468.8). Total num frames: 7462912. Throughput: 0: 1829.0, 1: 1419.1. Samples: 150977. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:06,620][109198] Avg episode reward: [(0, '3.919'), (1, '2.659')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:07,616][75209] Updated weights for policy 1, policy_version 551 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:08,797][75214] Updated weights for policy 0, policy_version 1277 (0.0013)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:11,619][109198] Fps is (10 sec: 14745.6, 60 sec: 11673.6, 300 sec: 11673.6). Total num frames: 7532544. Throughput: 0: 1933.9, 1: 1591.6. Samples: 172937. Policy #0 lag: (min: 0.0, avg: 0.3, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:11,620][109198] Avg episode reward: [(0, '3.919'), (1, '2.659')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:13,083][75209] Updated weights for policy 1, policy_version 561 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:14,833][75214] Updated weights for policy 0, policy_version 1287 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:16,619][109198] Fps is (10 sec: 14745.7, 60 sec: 12970.7, 300 sec: 11972.9). Total num frames: 7610368. Throughput: 0: 1931.3, 1: 1670.5. Samples: 189839. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:16,620][109198] Avg episode reward: [(0, '3.919'), (1, '2.659')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:18,054][75209] Updated weights for policy 1, policy_version 571 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:20,511][75214] Updated weights for policy 0, policy_version 1297 (0.0014)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:21,619][109198] Fps is (10 sec: 14745.6, 60 sec: 14063.0, 300 sec: 12112.5). Total num frames: 7680000. Throughput: 0: 1891.8, 1: 1701.3. Samples: 206476. Policy #0 lag: (min: 0.0, avg: 0.4, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:21,620][109198] Avg episode reward: [(0, '3.919'), (1, '2.659')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:23,325][75209] Updated weights for policy 1, policy_version 581 (0.0013)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:26,471][75214] Updated weights for policy 0, policy_version 1307 (0.0013)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:26,619][109198] Fps is (10 sec: 14745.6, 60 sec: 14404.3, 300 sec: 12342.6). Total num frames: 7757824. Throughput: 0: 1836.8, 1: 1755.5. Samples: 228146. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:26,620][109198] Avg episode reward: [(0, '3.919'), (1, '2.659')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:28,710][75209] Updated weights for policy 1, policy_version 591 (0.0015)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:30,318][75219] DAMAGECOUNT value on done: 405.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:30,318][75219] DAMAGECOUNT value on done: 385.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:30,319][75219] Sum rewards: 3.032, reward structure: {'HEALTH': '-3.650', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'weapon5': '0.028', 'weapon2': '0.038', 'AMMO2': '0.043', 'AMMO3': '0.099', 'AMMO4': '0.215', 'WEAPON4': '0.300', 'weapon4': '0.386', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'DAMAGECOUNT': '2.000', 'FRAGCOUNT': '2.000', 'weapon3': '3.352'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:30,319][75219] Sum rewards: 7.420, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.017', 'AMMO3': '0.057', 'AMMO4': '0.084', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.248', 'weapon2': '0.414', 'WEAPON3': '0.500', 'weapon5': '0.530', 'weapon3': '2.410', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.750'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:30,844][75219] DAMAGECOUNT value on done: 380.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:30,844][75219] DAMAGECOUNT value on done: 413.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:30,845][75219] Sum rewards: 6.972, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.003', 'AMMO5': '0.010', 'AMMO4': '0.015', 'AMMO3': '0.056', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.298', 'weapon2': '0.476', 'WEAPON3': '0.500', 'weapon5': '0.734', 'weapon3': '2.280', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.200'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:30,845][75219] Sum rewards: 2.875, reward structure: {'HEALTH': '-3.200', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.012', 'AMMO4': '0.024', 'weapon2': '0.034', 'AMMO3': '0.107', 'weapon5': '0.146', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.544', 'WEAPON3': '0.800', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.000', 'weapon3': '2.902'}\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:31,619][109198] Fps is (10 sec: 14745.7, 60 sec: 14472.5, 300 sec: 12441.6). Total num frames: 7827456. Throughput: 0: 1809.3, 1: 1804.6. Samples: 244875. Policy #0 lag: (min: 0.0, avg: 0.3, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:31,620][109198] Avg episode reward: [(0, '4.032'), (1, '2.659')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:31,716][75253] DAMAGECOUNT value on done: 150.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:31,717][75253] DAMAGECOUNT value on done: 245.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:31,718][75253] Sum rewards: 3.961, reward structure: {'HEALTH': '-0.630', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.010', 'AMMO3': '0.020', 'AMMO4': '0.050', 'weapon5': '0.056', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.242', 'weapon4': '0.374', 'weapon3': '0.836', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.600'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:32,324][75253] DAMAGECOUNT value on done: 365.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:32,325][75253] DAMAGECOUNT value on done: 430.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:32,325][75253] Sum rewards: 4.670, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.009', 'AMMO4': '0.025', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.416', 'weapon2': '0.492', 'weapon5': '0.962', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.100', 'weapon3': '1.922'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:32,764][75214] Updated weights for policy 0, policy_version 1317 (0.0013)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:33,567][75218] DAMAGECOUNT value on done: 30.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:33,567][75218] DAMAGECOUNT value on done: 65.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:33,568][75218] Sum rewards: 2.507, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.021', 'AMMO3': '0.042', 'AMMO4': '0.104', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.300', 'weapon5': '0.308', 'weapon4': '0.358', 'WEAPON3': '0.400', 'weapon2': '0.454', 'weapon3': '2.112'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:33,582][75216] Large shaping reward 2.942 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 2.0), ('DAMAGECOUNT', 1.94, 194.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:34,152][75218] DAMAGECOUNT value on done: 345.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:34,152][75218] DAMAGECOUNT value on done: 350.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:34,153][75218] Sum rewards: 3.818, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.015', 'AMMO4': '0.075', 'weapon5': '0.090', 'AMMO3': '0.105', 'WEAPON4': '0.200', 'weapon4': '0.228', 'WEAPON5': '0.300', 'weapon2': '0.444', 'WEAPON3': '0.800', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.450', 'weapon3': '3.096'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:34,153][75218] Sum rewards: 6.422, reward structure: {'HEALTH': '-2.400', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'weapon2': '0.004', 'AMMO5': '0.010', 'AMMO2': '0.018', 'AMMO3': '0.052', 'AMMO4': '0.090', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon5': '0.410', 'WEAPON3': '0.500', 'weapon4': '0.566', 'weapon3': '2.622', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.050'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:34,225][75209] Updated weights for policy 1, policy_version 601 (0.0016)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:34,361][75215] DAMAGECOUNT value on done: 105.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:34,361][75215] DAMAGECOUNT value on done: 146.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:34,361][75215] Sum rewards: 2.843, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.006', 'AMMO5': '0.014', 'AMMO4': '0.028', 'AMMO3': '0.085', 'weapon2': '0.282', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon4': '0.584', 'WEAPON3': '0.600', 'weapon5': '0.636', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '1.958'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:34,362][75215] Sum rewards: 4.650, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.714', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon5': '1.292', 'weapon3': '2.004'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:34,760][75218] DAMAGECOUNT value on done: 215.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:34,760][75218] DAMAGECOUNT value on done: 233.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:34,761][75218] Sum rewards: 2.931, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.015', 'AMMO3': '0.040', 'AMMO4': '0.076', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.282', 'weapon5': '0.318', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.650', 'weapon4': '0.704', 'weapon3': '2.038'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:34,908][75215] DAMAGECOUNT value on done: 260.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:34,909][75215] DAMAGECOUNT value on done: 312.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:34,909][75215] Sum rewards: 2.972, reward structure: {'HEALTH': '-1.300', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.022', 'AMMO3': '0.051', 'AMMO4': '0.109', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon2': '0.204', 'weapon4': '0.330', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.970', 'weapon5': '1.310', 'weapon3': '1.468'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:35,333][75218] DAMAGECOUNT value on done: 100.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:35,333][75218] DAMAGECOUNT value on done: 197.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:35,334][75218] Sum rewards: 2.955, reward structure: {'HEALTH': '-1.420', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.314', 'weapon2': '0.346', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.700', 'weapon5': '1.178', 'weapon3': '2.090'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:35,467][75219] DAMAGECOUNT value on done: 256.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:35,467][75219] DAMAGECOUNT value on done: 500.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:35,468][75219] Sum rewards: 2.326, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.015', 'AMMO3': '0.034', 'AMMO4': '0.074', 'WEAPON5': '0.100', 'weapon5': '0.170', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.420', 'weapon4': '0.670', 'FRAGCOUNT': '1.000', 'weapon3': '1.330', 'DAMAGECOUNT': '2.010'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:35,468][75219] Sum rewards: 5.543, reward structure: {'HEALTH': '-1.780', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.008', 'AMMO4': '0.040', 'AMMO3': '0.040', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon2': '0.350', 'WEAPON3': '0.400', 'weapon4': '0.424', 'weapon5': '0.646', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050', 'weapon3': '2.060'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:35,526][75217] DAMAGECOUNT value on done: 317.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:35,527][75217] DAMAGECOUNT value on done: 237.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:35,527][75217] Sum rewards: 4.308, reward structure: {'HEALTH': '-1.020', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.015', 'AMMO3': '0.040', 'AMMO4': '0.075', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.534', 'weapon5': '0.564', 'weapon4': '0.606', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '1.740'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:35,720][75253] DAMAGECOUNT value on done: 185.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:35,721][75253] DAMAGECOUNT value on done: 110.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:35,721][75253] Sum rewards: 2.541, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.150', 'WEAPON3': '0.200', 'weapon2': '0.706', 'weapon3': '0.888', 'weapon5': '2.474'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:35,995][75219] DAMAGECOUNT value on done: 353.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:35,995][75219] DAMAGECOUNT value on done: 140.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:35,996][75219] Sum rewards: 6.954, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'weapon2': '0.002', 'AMMO5': '0.007', 'AMMO2': '0.015', 'AMMO3': '0.040', 'AMMO4': '0.073', 'weapon5': '0.186', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.404', 'weapon3': '1.996', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '3.530'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:35,996][75219] Sum rewards: 2.196, reward structure: {'HEALTH': '-2.680', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.014', 'AMMO5': '0.015', 'AMMO4': '0.071', 'AMMO3': '0.075', 'weapon2': '0.108', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon5': '0.504', 'WEAPON3': '0.600', 'weapon4': '0.728', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon3': '2.160'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:36,101][75217] DAMAGECOUNT value on done: 132.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:36,101][75217] DAMAGECOUNT value on done: 120.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:36,102][75217] Sum rewards: 2.674, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO2': '0.017', 'AMMO3': '0.080', 'AMMO4': '0.084', 'weapon5': '0.148', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon2': '0.348', 'WEAPON3': '0.600', 'weapon4': '0.906', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon3': '1.878'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:36,102][75217] Sum rewards: 4.655, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.298', 'FRAGCOUNT': '1.000', 'weapon3': '1.092', 'DAMAGECOUNT': '1.100', 'weapon5': '2.710'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:36,239][75252] DAMAGECOUNT value on done: 417.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:36,239][75252] DAMAGECOUNT value on done: 390.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:36,240][75252] Sum rewards: 4.150, reward structure: {'HEALTH': '-2.800', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'weapon2': '0.002', 'AMMO5': '0.012', 'AMMO2': '0.013', 'AMMO4': '0.067', 'AMMO3': '0.073', 'WEAPON4': '0.200', 'weapon5': '0.290', 'WEAPON5': '0.300', 'weapon4': '0.390', 'WEAPON3': '0.600', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.440', 'weapon3': '2.562'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:36,240][75252] Sum rewards: 5.150, reward structure: {'HEALTH': '-2.290', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.001', 'AMMO4': '0.004', 'AMMO5': '0.010', 'AMMO3': '0.077', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.288', 'weapon2': '0.410', 'weapon5': '0.522', 'WEAPON3': '0.600', 'FRAGCOUNT': '2.000', 'weapon3': '2.378', 'DAMAGECOUNT': '2.850'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:36,332][75253] DAMAGECOUNT value on done: 172.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:36,332][75253] DAMAGECOUNT value on done: 75.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:36,333][75253] Sum rewards: 3.105, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.015', 'AMMO3': '0.040', 'AMMO4': '0.075', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.206', 'WEAPON3': '0.400', 'weapon5': '0.580', 'weapon4': '0.712', 'FRAGCOUNT': '0.998', 'DAMAGECOUNT': '1.600', 'weapon3': '2.072'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:36,500][75217] DAMAGECOUNT value on done: 186.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:36,500][75217] DAMAGECOUNT value on done: 163.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:36,501][75217] Sum rewards: 2.675, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.015', 'AMMO3': '0.048', 'AMMO4': '0.074', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.490', 'weapon4': '0.548', 'DAMAGECOUNT': '0.650', 'weapon2': '0.760', 'weapon3': '1.436'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:36,501][75217] Sum rewards: 2.276, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.008', 'AMMO3': '0.036', 'AMMO4': '0.038', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.300', 'weapon4': '0.360', 'weapon2': '0.408', 'DAMAGECOUNT': '0.680', 'weapon3': '1.040', 'weapon5': '1.202'}\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:36,619][109198] Fps is (10 sec: 13926.3, 60 sec: 14472.5, 300 sec: 12528.9). Total num frames: 7897088. Throughput: 0: 1744.4, 1: 1836.4. Samples: 259640. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:36,620][109198] Avg episode reward: [(0, '4.024'), (1, '2.752')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:36,718][75252] DAMAGECOUNT value on done: 40.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:36,718][75252] DAMAGECOUNT value on done: 78.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:37,064][75217] DAMAGECOUNT value on done: 218.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:37,065][75217] DAMAGECOUNT value on done: 70.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:37,065][75217] Sum rewards: 4.290, reward structure: {'HEALTH': '-0.700', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.020', 'AMMO3': '0.020', 'weapon2': '0.048', 'AMMO4': '0.099', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.148', 'WEAPON3': '0.200', 'weapon4': '0.616', 'weapon3': '0.754', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.880'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:37,341][75252] DAMAGECOUNT value on done: 5.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:37,341][75252] DAMAGECOUNT value on done: 65.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:38,011][75252] DAMAGECOUNT value on done: 169.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:38,011][75252] DAMAGECOUNT value on done: 104.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:38,012][75252] Sum rewards: 4.528, reward structure: {'HEALTH': '-1.250', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.010', 'weapon2': '0.036', 'AMMO3': '0.040', 'AMMO4': '0.049', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.560', 'weapon4': '0.648', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.690', 'weapon3': '1.938'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:38,212][75216] DAMAGECOUNT value on done: 371.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:38,212][75216] DAMAGECOUNT value on done: 165.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:38,213][75216] Sum rewards: 3.386, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.022', 'AMMO3': '0.059', 'AMMO4': '0.107', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon2': '0.362', 'WEAPON3': '0.500', 'weapon4': '0.548', 'weapon5': '0.580', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.650', 'weapon3': '2.050'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:38,382][75215] DAMAGECOUNT value on done: 70.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:38,382][75215] DAMAGECOUNT value on done: 190.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:38,383][75215] Sum rewards: 2.399, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.004', 'FRAGCOUNT': '-0.001', 'AMMO2': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.188', 'weapon2': '0.194', 'WEAPON3': '0.400', 'weapon5': '0.444', 'DAMAGECOUNT': '0.850', 'weapon3': '2.084'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:38,952][75216] DAMAGECOUNT value on done: 421.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:38,952][75216] DAMAGECOUNT value on done: 370.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:38,952][75216] Sum rewards: 5.509, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.010', 'AMMO3': '0.042', 'AMMO4': '0.050', 'weapon5': '0.052', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon2': '0.254', 'WEAPON3': '0.400', 'weapon4': '0.654', 'weapon3': '1.714', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.130'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:38,953][75216] Sum rewards: 2.499, reward structure: {'HEALTH': '-2.100', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.003', 'AMMO5': '0.005', 'AMMO4': '0.014', 'AMMO3': '0.067', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.180', 'weapon2': '0.272', 'weapon4': '0.358', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon3': '2.800'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:38,955][75215] DAMAGECOUNT value on done: 125.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:38,956][75215] DAMAGECOUNT value on done: 0.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:38,956][75215] Sum rewards: 2.379, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO5': '0.003', 'AMMO4': '0.011', 'AMMO3': '0.032', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON6': '0.200', 'weapon6': '0.208', 'weapon4': '0.282', 'WEAPON3': '0.300', 'weapon5': '0.324', 'weapon2': '0.496', 'DAMAGECOUNT': '0.900', 'weapon3': '1.222'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:38,957][75215] Sum rewards: 1.090, reward structure: {'HEALTH': '-1.700', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO2': '0.008', 'AMMO5': '0.009', 'AMMO4': '0.038', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.274', 'WEAPON3': '0.400', 'weapon4': '0.412', 'weapon2': '0.466', 'weapon3': '1.844'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:39,080][75214] Updated weights for policy 0, policy_version 1327 (0.0013)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:39,511][75209] Updated weights for policy 1, policy_version 611 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:39,659][75216] DAMAGECOUNT value on done: 70.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:39,659][75216] DAMAGECOUNT value on done: 25.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:39,660][75216] Sum rewards: 2.726, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.746', 'weapon5': '1.086', 'weapon3': '2.106'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:39,708][75254] DAMAGECOUNT value on done: 123.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:39,709][75254] DAMAGECOUNT value on done: 36.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:40,157][75216] DAMAGECOUNT value on done: 339.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:40,157][75216] DAMAGECOUNT value on done: 70.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:40,157][75216] Sum rewards: 5.200, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.013', 'AMMO3': '0.052', 'AMMO4': '0.065', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon2': '0.212', 'WEAPON3': '0.400', 'weapon4': '0.506', 'FRAGCOUNT': '0.999', 'weapon5': '1.300', 'weapon3': '1.358', 'DAMAGECOUNT': '2.090'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:40,290][75254] DAMAGECOUNT value on done: 320.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:40,291][75254] DAMAGECOUNT value on done: 440.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:40,291][75254] Sum rewards: 4.346, reward structure: {'HEALTH': '-3.850', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.015', 'weapon5': '0.016', 'AMMO5': '0.020', 'AMMO4': '0.075', 'AMMO3': '0.079', 'weapon2': '0.120', 'WEAPON4': '0.200', 'weapon4': '0.384', 'WEAPON5': '0.400', 'WEAPON3': '0.700', 'DAMAGECOUNT': '3.000', 'FRAGCOUNT': '3.000', 'weapon3': '3.186'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:40,292][75254] Sum rewards: 6.381, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.027', 'weapon2': '0.040', 'AMMO3': '0.100', 'AMMO4': '0.137', 'WEAPON4': '0.300', 'weapon4': '0.302', 'WEAPON5': '0.400', 'WEAPON3': '0.700', 'weapon5': '1.058', 'weapon3': '2.346', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.950'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:40,839][75254] DAMAGECOUNT value on done: 345.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:40,840][75254] DAMAGECOUNT value on done: 15.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:41,427][75254] DAMAGECOUNT value on done: 205.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:41,427][75254] DAMAGECOUNT value on done: 160.0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:41,619][109198] Fps is (10 sec: 14336.0, 60 sec: 14404.2, 300 sec: 12652.1). Total num frames: 7970816. Throughput: 0: 1689.9, 1: 1881.1. Samples: 281083. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:41,620][109198] Avg episode reward: [(0, '3.949'), (1, '2.782')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:44,805][75214] Updated weights for policy 0, policy_version 1337 (0.0013)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:45,045][75209] Updated weights for policy 1, policy_version 621 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:46,619][109198] Fps is (10 sec: 14336.0, 60 sec: 14404.3, 300 sec: 12719.2). Total num frames: 8040448. Throughput: 0: 1692.0, 1: 1896.6. Samples: 297136. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:46,620][109198] Avg episode reward: [(0, '3.949'), (1, '2.782')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:50,394][75214] Updated weights for policy 0, policy_version 1347 (0.0013)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:50,833][75209] Updated weights for policy 1, policy_version 631 (0.0014)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:51,619][109198] Fps is (10 sec: 14336.0, 60 sec: 14472.5, 300 sec: 12820.5). Total num frames: 8114176. Throughput: 0: 1716.8, 1: 1888.5. Samples: 313219. Policy #0 lag: (min: 0.0, avg: 0.7, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:51,620][109198] Avg episode reward: [(0, '3.949'), (1, '2.782')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:55,270][75218] Large shaping reward 2.562 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 2.0), ('DAMAGECOUNT', 1.56, 156.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:55,789][75214] Updated weights for policy 0, policy_version 1357 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:38:56,294][75209] Updated weights for policy 1, policy_version 641 (0.0013)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:56,619][109198] Fps is (10 sec: 14745.7, 60 sec: 14472.5, 300 sec: 12912.2). Total num frames: 8187904. Throughput: 0: 1741.2, 1: 1883.5. Samples: 336048. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:38:56,620][109198] Avg episode reward: [(0, '3.949'), (1, '2.782')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:00,989][75214] Updated weights for policy 0, policy_version 1367 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:01,560][75209] Updated weights for policy 1, policy_version 651 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:01,619][109198] Fps is (10 sec: 15564.9, 60 sec: 14745.6, 300 sec: 13070.0). Total num frames: 8269824. Throughput: 0: 1752.4, 1: 1881.6. Samples: 353371. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:01,620][109198] Avg episode reward: [(0, '3.949'), (1, '2.782')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:01,624][75052] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000651_2666496.pth...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:01,624][74942] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001368_5603328.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:01,688][74942] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001054_4317184.pth\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:01,688][75052] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000341_1396736.pth\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:05,101][75254] Large shaping reward 2.602 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 1.0), ('DAMAGECOUNT', 1.6, 160.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:06,278][75219] DAMAGECOUNT value on done: 725.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:06,278][75219] DAMAGECOUNT value on done: 685.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:06,279][75219] Sum rewards: 5.596, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.030', 'weapon2': '0.076', 'AMMO3': '0.123', 'AMMO4': '0.149', 'WEAPON4': '0.300', 'WEAPON5': '0.400', 'weapon4': '0.452', 'weapon5': '0.758', 'WEAPON3': '0.800', 'weapon3': '2.288', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.200'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:06,279][75219] Sum rewards: 5.183, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.019', 'weapon5': '0.020', 'weapon2': '0.052', 'AMMO3': '0.088', 'AMMO4': '0.093', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon4': '0.336', 'WEAPON3': '0.700', 'DAMAGECOUNT': '3.000', 'FRAGCOUNT': '3.000', 'weapon3': '3.260'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:06,400][75214] Updated weights for policy 0, policy_version 1377 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:06,619][109198] Fps is (10 sec: 15564.8, 60 sec: 14677.4, 300 sec: 13142.8). Total num frames: 8343552. Throughput: 0: 1774.1, 1: 1875.1. Samples: 370689. Policy #0 lag: (min: 0.0, avg: 0.8, max: 3.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:06,620][109198] Avg episode reward: [(0, '3.990'), (1, '2.782')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:06,784][75219] DAMAGECOUNT value on done: 555.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:06,784][75219] DAMAGECOUNT value on done: 448.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:06,784][75219] Sum rewards: 5.202, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.018', 'AMMO3': '0.040', 'AMMO4': '0.092', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.412', 'weapon4': '0.518', 'weapon2': '0.608', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.750', 'weapon3': '1.956'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:06,907][75209] Updated weights for policy 1, policy_version 661 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:07,921][75253] DAMAGECOUNT value on done: 360.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:07,922][75253] DAMAGECOUNT value on done: 181.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:07,922][75253] Sum rewards: 3.926, reward structure: {'HEALTH': '-0.310', 'HITCOUNT': '0.000', 'AMMO2': '0.010', 'AMMO3': '0.019', 'AMMO4': '0.050', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.296', 'weapon2': '0.448', 'weapon3': '0.962', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:08,410][75253] DAMAGECOUNT value on done: 565.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:08,410][75253] DAMAGECOUNT value on done: 569.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:08,411][75253] Sum rewards: 3.676, reward structure: {'HEALTH': '-1.650', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO4': '0.002', 'AMMO5': '0.007', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'weapon5': '0.286', 'WEAPON3': '0.400', 'weapon2': '0.876', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.390', 'weapon3': '2.124'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:09,096][75215] DAMAGECOUNT value on done: 301.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:09,097][75215] DAMAGECOUNT value on done: 130.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:09,097][75215] Sum rewards: 6.629, reward structure: {'HEALTH': '-0.250', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.716', 'FRAGCOUNT': '1.000', 'weapon3': '1.032', 'DAMAGECOUNT': '1.550', 'weapon5': '2.256'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:09,098][75215] Sum rewards: 0.688, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.010', 'AMMO4': '0.048', 'AMMO3': '0.048', 'weapon2': '0.054', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.250', 'weapon4': '0.342', 'WEAPON3': '0.400', 'weapon5': '1.368', 'weapon3': '1.860'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:09,441][75218] DAMAGECOUNT value on done: 125.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:09,442][75218] DAMAGECOUNT value on done: 322.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:09,442][75218] Sum rewards: 0.794, reward structure: {'HEALTH': '-2.680', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.024', 'AMMO2': '-0.005', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.059', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.268', 'weapon5': '0.498', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.950', 'weapon2': '1.092', 'weapon3': '1.828'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:09,443][75218] Sum rewards: 6.057, reward structure: {'HEALTH': '-0.950', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon5': '0.796', 'FRAGCOUNT': '1.000', 'weapon2': '1.056', 'weapon3': '1.232', 'DAMAGECOUNT': '2.570'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:09,642][75215] DAMAGECOUNT value on done: 522.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:09,642][75215] DAMAGECOUNT value on done: 595.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:09,643][75215] Sum rewards: 2.861, reward structure: {'HEALTH': '-3.350', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.019', 'weapon2': '0.068', 'AMMO4': '0.092', 'AMMO3': '0.115', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon4': '0.466', 'WEAPON3': '0.800', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.100', 'weapon3': '2.936'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:09,643][75215] Sum rewards: 7.292, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.013', 'AMMO5': '0.015', 'AMMO4': '0.065', 'AMMO3': '0.076', 'weapon2': '0.096', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.356', 'WEAPON3': '0.600', 'weapon5': '0.710', 'weapon3': '2.510', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.350'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:10,043][75218] DAMAGECOUNT value on done: 355.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:10,043][75218] DAMAGECOUNT value on done: 498.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:10,044][75218] Sum rewards: 4.358, reward structure: {'HEALTH': '-0.100', 'HITCOUNT': '0.000', 'AMMO2': '0.010', 'AMMO3': '0.020', 'AMMO4': '0.050', 'WEAPON4': '0.100', 'weapon2': '0.106', 'WEAPON3': '0.200', 'weapon4': '0.426', 'FRAGCOUNT': '1.000', 'weapon3': '1.066', 'DAMAGECOUNT': '1.480'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:10,078][75218] DAMAGECOUNT value on done: 353.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:10,078][75218] DAMAGECOUNT value on done: 320.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:10,078][75218] Sum rewards: 4.552, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.038', 'WEAPON5': '0.100', 'WEAPON3': '0.300', 'weapon2': '0.396', 'FRAGCOUNT': '1.000', 'weapon3': '1.106', 'DAMAGECOUNT': '1.200', 'weapon5': '2.438'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:10,079][75218] Sum rewards: 2.989, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.002', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.013', 'weapon2': '0.040', 'AMMO3': '0.060', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.414', 'WEAPON3': '0.500', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon5': '1.066', 'weapon3': '2.348'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:10,686][75218] DAMAGECOUNT value on done: 195.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:10,686][75218] DAMAGECOUNT value on done: 212.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:10,687][75218] Sum rewards: 2.249, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO5': '0.004', 'AMMO4': '0.011', 'AMMO3': '0.043', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.276', 'weapon5': '0.388', 'WEAPON3': '0.400', 'weapon2': '0.422', 'DAMAGECOUNT': '0.950', 'weapon3': '1.604'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:11,145][75219] DAMAGECOUNT value on done: 376.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:11,145][75219] DAMAGECOUNT value on done: 640.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:11,146][75219] Sum rewards: 4.406, reward structure: {'HEALTH': '-1.400', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.228', 'weapon2': '0.344', 'WEAPON3': '0.400', 'weapon5': '0.984', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.200', 'weapon3': '2.330'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:11,146][75219] Sum rewards: 3.188, reward structure: {'HEALTH': '-2.100', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.015', 'AMMO4': '0.074', 'AMMO3': '0.075', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon2': '0.364', 'weapon5': '0.494', 'WEAPON3': '0.600', 'weapon4': '0.652', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.400', 'weapon3': '2.206'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:11,379][75217] DAMAGECOUNT value on done: 247.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:11,379][75217] DAMAGECOUNT value on done: 452.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:11,380][75217] Sum rewards: 3.069, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.010', 'AMMO3': '0.037', 'AMMO4': '0.050', 'weapon2': '0.092', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.300', 'weapon4': '0.396', 'weapon5': '0.786', 'weapon3': '0.846', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.350'}\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:11,619][109198] Fps is (10 sec: 14745.6, 60 sec: 14745.6, 300 sec: 13209.6). Total num frames: 8417280. Throughput: 0: 1795.2, 1: 1873.0. Samples: 393218. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:11,620][109198] Avg episode reward: [(0, '4.011'), (1, '2.760')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:11,811][75219] DAMAGECOUNT value on done: 528.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:11,811][75219] DAMAGECOUNT value on done: 380.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:11,812][75219] Sum rewards: 2.650, reward structure: {'HEALTH': '-2.730', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'weapon5': '0.022', 'AMMO2': '0.028', 'AMMO3': '0.072', 'AMMO4': '0.140', 'WEAPON4': '0.200', 'weapon2': '0.232', 'weapon4': '0.292', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.750', 'weapon3': '2.728'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:11,812][75219] Sum rewards: 6.148, reward structure: {'HEALTH': '-1.750', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.018', 'AMMO2': '-0.004', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.228', 'weapon2': '0.310', 'WEAPON3': '0.400', 'weapon5': '1.160', 'FRAGCOUNT': '2.000', 'weapon3': '2.072', 'DAMAGECOUNT': '2.400'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:11,854][75253] DAMAGECOUNT value on done: 225.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:11,854][75253] DAMAGECOUNT value on done: 130.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:11,855][75253] Sum rewards: 2.618, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.020', 'AMMO3': '0.050', 'AMMO4': '0.098', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon2': '0.124', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.400', 'weapon4': '0.602', 'weapon3': '1.376', 'weapon5': '1.544'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:11,928][75217] DAMAGECOUNT value on done: 160.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:11,928][75217] DAMAGECOUNT value on done: 342.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:11,929][75217] Sum rewards: 5.618, reward structure: {'HEALTH': '-1.400', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.005', 'AMMO4': '0.025', 'AMMO3': '0.046', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.172', 'WEAPON3': '0.400', 'weapon2': '0.554', 'weapon5': '1.170', 'weapon3': '1.342', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.100'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:12,030][75214] Updated weights for policy 0, policy_version 1387 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:12,431][75217] DAMAGECOUNT value on done: 300.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:12,431][75217] DAMAGECOUNT value on done: 278.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:12,432][75217] Sum rewards: 4.174, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.049', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.408', 'weapon5': '0.536', 'weapon4': '0.562', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.140', 'weapon3': '1.824'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:12,432][75217] Sum rewards: 3.761, reward structure: {'HEALTH': '-1.270', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO5': '0.007', 'AMMO4': '0.012', 'AMMO3': '0.047', 'weapon4': '0.084', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon2': '0.354', 'WEAPON3': '0.400', 'weapon5': '0.412', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150', 'weapon3': '2.262'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:12,491][75253] DAMAGECOUNT value on done: 237.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:12,492][75253] DAMAGECOUNT value on done: 80.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:12,704][75209] Updated weights for policy 1, policy_version 671 (0.0013)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:13,042][75217] DAMAGECOUNT value on done: 553.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:13,042][75217] Sum rewards: 7.248, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.015', 'weapon4': '0.062', 'AMMO3': '0.063', 'AMMO4': '0.075', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon2': '0.222', 'WEAPON3': '0.500', 'weapon5': '1.266', 'weapon3': '2.384', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.350'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:13,043][75217] DAMAGECOUNT value on done: 285.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:13,043][75217] Sum rewards: 3.290, reward structure: {'HEALTH': '-3.200', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.029', 'AMMO3': '0.069', 'AMMO4': '0.144', 'WEAPON4': '0.200', 'weapon4': '0.326', 'WEAPON5': '0.400', 'weapon2': '0.400', 'weapon5': '0.418', 'WEAPON3': '0.600', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.150', 'weapon3': '2.734'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:13,327][75252] DAMAGECOUNT value on done: 472.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:13,328][75252] DAMAGECOUNT value on done: 392.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:13,328][75252] Sum rewards: 2.383, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.020', 'AMMO3': '0.030', 'AMMO4': '0.099', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.388', 'DAMAGECOUNT': '0.550', 'weapon5': '0.616', 'weapon4': '0.772', 'weapon3': '1.304'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:13,835][75252] DAMAGECOUNT value on done: 123.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:13,835][75252] DAMAGECOUNT value on done: 155.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:13,836][75252] Sum rewards: 5.263, reward structure: {'HEALTH': '-0.450', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.025', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.123', 'weapon2': '0.148', 'WEAPON3': '0.200', 'weapon4': '0.536', 'weapon3': '0.932', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150', 'weapon5': '1.374'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:14,435][75252] DAMAGECOUNT value on done: 145.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:14,435][75252] DAMAGECOUNT value on done: 70.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:14,435][75252] Sum rewards: 6.037, reward structure: {'HEALTH': '-0.050', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.015', 'AMMO3': '0.020', 'AMMO4': '0.075', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.412', 'weapon2': '0.504', 'weapon3': '0.990', 'FRAGCOUNT': '1.000', 'weapon5': '1.266', 'DAMAGECOUNT': '1.400'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:15,036][75252] DAMAGECOUNT value on done: 469.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:15,036][75252] DAMAGECOUNT value on done: 429.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:15,036][75252] Sum rewards: 7.061, reward structure: {'HEALTH': '-2.600', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'weapon2': '0.002', 'AMMO2': '0.013', 'AMMO5': '0.015', 'AMMO4': '0.067', 'AMMO3': '0.071', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon5': '0.542', 'WEAPON3': '0.600', 'weapon4': '0.604', 'weapon3': '2.596', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.650'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:15,037][75252] Sum rewards: 3.641, reward structure: {'HEALTH': '-3.550', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'weapon5': '0.006', 'AMMO5': '0.020', 'weapon2': '0.022', 'AMMO2': '0.043', 'AMMO3': '0.108', 'AMMO4': '0.214', 'weapon4': '0.256', 'WEAPON4': '0.400', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.600', 'weapon3': '3.322'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:15,106][75216] DAMAGECOUNT value on done: 265.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:15,106][75216] DAMAGECOUNT value on done: 576.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:15,107][75216] Sum rewards: 3.102, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'weapon2': '0.002', 'AMMO5': '0.010', 'AMMO2': '0.029', 'AMMO3': '0.071', 'AMMO4': '0.146', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon4': '0.456', 'WEAPON3': '0.500', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.674', 'weapon5': '1.714'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:15,107][75216] Sum rewards: 6.521, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.025', 'AMMO3': '0.040', 'WEAPON5': '0.100', 'AMMO4': '0.123', 'WEAPON4': '0.200', 'weapon2': '0.262', 'WEAPON3': '0.400', 'weapon4': '0.646', 'weapon5': '0.908', 'weapon3': '1.762', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:15,685][75216] DAMAGECOUNT value on done: 550.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:15,685][75216] DAMAGECOUNT value on done: 421.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:15,686][75216] Sum rewards: 5.102, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.020', 'AMMO3': '0.040', 'AMMO4': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon5': '0.206', 'WEAPON3': '0.400', 'weapon2': '0.660', 'weapon4': '0.706', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.800', 'weapon3': '1.866'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:16,197][75215] DAMAGECOUNT value on done: 205.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:16,197][75215] Sum rewards: 5.675, reward structure: {'HEALTH': '-0.900', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.424', 'FRAGCOUNT': '1.000', 'weapon3': '1.186', 'DAMAGECOUNT': '1.350', 'weapon5': '2.320'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:16,197][75215] DAMAGECOUNT value on done: 280.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:16,249][75216] DAMAGECOUNT value on done: 158.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:16,250][75216] DAMAGECOUNT value on done: 75.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:16,250][75216] Sum rewards: 2.839, reward structure: {'HEALTH': '-1.180', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.040', 'weapon2': '0.066', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.454', 'DAMAGECOUNT': '0.500', 'weapon5': '0.922', 'weapon3': '2.230'}\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:16,619][109198] Fps is (10 sec: 13926.3, 60 sec: 14540.8, 300 sec: 13205.5). Total num frames: 8482816. Throughput: 0: 1791.3, 1: 1851.4. Samples: 408795. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:16,620][109198] Avg episode reward: [(0, '4.011'), (1, '2.911')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:16,640][75052] Saving new best policy, reward=2.911!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:16,745][75254] DAMAGECOUNT value on done: 248.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:16,745][75254] DAMAGECOUNT value on done: 56.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:16,745][75254] Sum rewards: 3.601, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.010', 'AMMO3': '0.030', 'AMMO4': '0.050', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.402', 'weapon4': '0.494', 'weapon5': '0.536', 'FRAGCOUNT': '0.999', 'weapon3': '1.226', 'DAMAGECOUNT': '1.250'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:16,766][75215] DAMAGECOUNT value on done: 127.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:16,767][75215] DAMAGECOUNT value on done: 77.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:16,767][75215] Sum rewards: 2.221, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'DAMAGECOUNT': '0.020', 'AMMO2': '0.020', 'AMMO3': '0.056', 'AMMO4': '0.100', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon2': '0.220', 'WEAPON3': '0.400', 'weapon4': '0.610', 'weapon3': '0.974', 'weapon5': '1.412'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:16,840][75216] DAMAGECOUNT value on done: 315.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:16,841][75216] DAMAGECOUNT value on done: 429.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:16,841][75216] Sum rewards: 7.855, reward structure: {'HEALTH': '-0.900', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'weapon2': '0.054', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.342', 'weapon3': '1.224', 'FRAGCOUNT': '2.000', 'weapon5': '2.230', 'DAMAGECOUNT': '2.450'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:17,321][75254] DAMAGECOUNT value on done: 373.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:17,321][75254] DAMAGECOUNT value on done: 440.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:17,882][75254] DAMAGECOUNT value on done: 195.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:17,882][75254] DAMAGECOUNT value on done: 575.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:17,883][75254] Sum rewards: 1.709, reward structure: {'HEALTH': '-2.250', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'weapon2': '0.004', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO4': '0.025', 'AMMO3': '0.055', 'weapon5': '0.076', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon4': '0.492', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.696', 'DAMAGECOUNT': '1.800'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:17,883][75254] Sum rewards: 6.174, reward structure: {'HEALTH': '-1.750', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.020', 'AMMO2': '-0.004', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.039', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.224', 'weapon2': '0.316', 'WEAPON3': '0.400', 'weapon5': '1.028', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.300', 'weapon3': '2.330'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:18,029][75214] Updated weights for policy 0, policy_version 1397 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:18,462][75254] DAMAGECOUNT value on done: 225.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:18,462][75254] DAMAGECOUNT value on done: 330.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:18,463][75254] Sum rewards: 5.493, reward structure: {'HEALTH': '-0.200', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.358', 'FRAGCOUNT': '1.000', 'weapon5': '1.090', 'weapon3': '1.252', 'DAMAGECOUNT': '1.700'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:18,552][75209] Updated weights for policy 1, policy_version 681 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:21,619][109198] Fps is (10 sec: 13926.4, 60 sec: 14609.1, 300 sec: 13264.7). Total num frames: 8556544. Throughput: 0: 1814.5, 1: 1839.4. Samples: 424065. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:21,620][109198] Avg episode reward: [(0, '4.041'), (1, '2.891')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:23,946][75214] Updated weights for policy 0, policy_version 1407 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:24,545][75209] Updated weights for policy 1, policy_version 691 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:26,619][109198] Fps is (10 sec: 13926.4, 60 sec: 14404.3, 300 sec: 13258.9). Total num frames: 8622080. Throughput: 0: 1815.4, 1: 1814.5. Samples: 444428. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:26,620][109198] Avg episode reward: [(0, '4.041'), (1, '2.891')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:30,031][75214] Updated weights for policy 0, policy_version 1417 (0.0013)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:30,421][75209] Updated weights for policy 1, policy_version 701 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:31,619][109198] Fps is (10 sec: 13516.8, 60 sec: 14404.3, 300 sec: 13282.7). Total num frames: 8691712. Throughput: 0: 1811.5, 1: 1804.9. Samples: 459875. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:31,620][109198] Avg episode reward: [(0, '4.041'), (1, '2.891')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:35,420][75214] Updated weights for policy 0, policy_version 1427 (0.0016)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:35,924][75209] Updated weights for policy 1, policy_version 711 (0.0013)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:36,619][109198] Fps is (10 sec: 14336.0, 60 sec: 14472.5, 300 sec: 13333.2). Total num frames: 8765440. Throughput: 0: 1815.7, 1: 1814.0. Samples: 476554. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:36,620][109198] Avg episode reward: [(0, '4.041'), (1, '2.891')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:41,167][75214] Updated weights for policy 0, policy_version 1437 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:41,619][109198] Fps is (10 sec: 14336.1, 60 sec: 14404.3, 300 sec: 13353.0). Total num frames: 8835072. Throughput: 0: 1799.6, 1: 1799.2. Samples: 497996. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:41,620][109198] Avg episode reward: [(0, '4.041'), (1, '2.891')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:41,809][75209] Updated weights for policy 1, policy_version 721 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:42,740][109198] Keyboard interrupt detected in the event loop EvtLoop [Runner_EvtLoop, process=main process 109198], exiting...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:42,742][109198] Runner profile tree view:\n", + "main_loop: 158.9516\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:42,741][74942] Stopping Batcher_0...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:42,743][109198] Collected {0: 5894144, 1: 2957312}, FPS: 12704.0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:42,742][75052] Stopping Batcher_1...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:42,742][74942] Loop batcher_evt_loop terminating...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:42,743][74942] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001439_5894144.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:42,743][75052] Loop batcher_evt_loop terminating...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:39:42,744][75052] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000722_2957312.pth...\u001b[0m\n" + ] + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "\u001b[36m[2023-09-14 12:39:42,759][75209] Weights refcount: 2 0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:42,760][75209] Stopping InferenceWorker_p1-w0...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:42,761][75209] Loop inference_proc1-0_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:42,762][75214] Weights refcount: 2 0\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:42,763][75214] Stopping InferenceWorker_p0-w0...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:42,763][75214] Loop inference_proc0-0_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:42,802][74942] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001187_4861952.pth\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:42,803][75052] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000481_1970176.pth\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:42,809][74942] Stopping LearnerWorker_p0...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:42,809][74942] Loop learner_proc0_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:42,810][75052] Stopping LearnerWorker_p1...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:42,810][75052] Loop learner_proc1_evt_loop terminating...\u001b[0m\n", + "[W CudaIPCTypes.cpp:15] Producer process has been terminated before all shared CUDA tensors released. See Note [Sharing CUDA tensors]\n", + "[W CudaIPCTypes.cpp:15] Producer process has been terminated before all shared CUDA tensors released. See Note [Sharing CUDA tensors]\n", + "\u001b[36m[2023-09-14 12:39:43,547][75254] Stopping RolloutWorker_w7...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:43,547][75215] Stopping RolloutWorker_w1...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:43,548][75215] Loop rollout_proc1_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:43,548][75254] Loop rollout_proc7_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:43,549][75218] Stopping RolloutWorker_w3...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:43,550][75218] Loop rollout_proc3_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:43,550][75253] Stopping RolloutWorker_w6...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:43,551][75253] Loop rollout_proc6_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:43,553][75252] Stopping RolloutWorker_w5...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:43,554][75252] Loop rollout_proc5_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:43,554][75219] Stopping RolloutWorker_w4...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:43,556][75219] Loop rollout_proc4_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:43,558][75217] Stopping RolloutWorker_w2...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:43,558][75217] Loop rollout_proc2_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:43,569][75216] Stopping RolloutWorker_w0...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:39:43,570][75216] Loop rollout_proc0_evt_loop terminating...\u001b[0m\n" ] } ], "source": [ + "\n", "## Start the training, this should take around 15 minutes\n", "register_vizdoom_components()\n", "\n", "# The scenario we train on today is health gathering\n", "# other scenarios include \"doom_basic\", \"doom_two_colors_easy\", \"doom_dm\", \"doom_dwango5\", \"doom_my_way_home\", \"doom_deadly_corridor\", \"doom_defend_the_center\", \"doom_defend_the_line\", \"predict_position\", \"take_cover\"\n", - "env = \"doom_dwango5\"\n", + "env = \"doom_duel\"\n", "cfg = parse_vizdoom_cfg(\n", - " argv=[f\"--env={env}\", \"--num_workers=8\", \"--num_envs_per_worker=4\", \"--train_for_env_steps=1000000\"]\n", + " argv=[f\"--env={env}\", \"--num_workers=8\", \"--num_envs_per_worker=4\", \"--train_for_env_steps=10000000\"]\n", ")\n", "\n", "status = run_rl(cfg)" @@ -7025,52 +2313,532 @@ }, { "cell_type": "code", - "execution_count": 5, + "execution_count": 7, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ - "\u001b[33m[2023-09-12 21:01:01,865][28625] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,866][28625] Overriding arg 'num_workers' with value 1 passed from command line\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,867][28625] Adding new argument 'no_render'=True that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,869][28625] Adding new argument 'save_video'=True that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,870][28625] Adding new argument 'video_frames'=1000000000.0 that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,872][28625] Adding new argument 'video_name'=None that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,873][28625] Adding new argument 'max_num_frames'=1000000000.0 that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,875][28625] Adding new argument 'max_num_episodes'=10 that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,876][28625] Adding new argument 'push_to_hub'=False that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,877][28625] Adding new argument 'hf_repository'=None that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,877][28625] Adding new argument 'policy_index'=0 that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,878][28625] Adding new argument 'eval_deterministic'=False that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,879][28625] Adding new argument 'train_script'=None that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,879][28625] Adding new argument 'enjoy_script'=None that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,880][28625] Using frameskip 1 and render_action_repeat=4 for evaluation\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,881][28625] Multi agent env, num agents: 8\u001b[0m\n", + "\u001b[33m[2023-09-14 12:03:16,383][97397] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,385][97397] Overriding arg 'num_workers' with value 1 passed from command line\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,386][97397] Adding new argument 'no_render'=True that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,386][97397] Adding new argument 'save_video'=True that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,387][97397] Adding new argument 'video_frames'=1000000000.0 that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,387][97397] Adding new argument 'video_name'=None that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,388][97397] Adding new argument 'max_num_frames'=1000000000.0 that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,389][97397] Adding new argument 'max_num_episodes'=10 that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,389][97397] Adding new argument 'push_to_hub'=False that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,390][97397] Adding new argument 'hf_repository'=None that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,391][97397] Adding new argument 'policy_index'=0 that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,392][97397] Adding new argument 'eval_deterministic'=False that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,392][97397] Adding new argument 'train_script'=None that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,393][97397] Adding new argument 'enjoy_script'=None that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,394][97397] Using frameskip 1 and render_action_repeat=4 for evaluation\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,397][97397] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,424][97397] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.num_agents to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.num_agents` for environment variables or `env.get_wrapper_attr('num_agents')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.is_multiagent to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.is_multiagent` for environment variables or `env.get_wrapper_attr('is_multiagent')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", - "\u001b[36m[2023-09-12 21:01:01,913][28625] RunningMeanStd input shape: (23,)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,914][28625] RunningMeanStd input shape: (3, 72, 128)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,915][28625] RunningMeanStd input shape: (1,)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,927][28625] ConvEncoder: input_channels=3\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,971][28625] Conv encoder output size: 512\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,974][28625] Policy head output size: 640\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:02,005][28625] No checkpoints found\u001b[0m\n" + "\u001b[36m[2023-09-14 12:03:16,428][97397] RunningMeanStd input shape: (23,)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,429][97397] RunningMeanStd input shape: (3, 72, 128)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,430][97397] RunningMeanStd input shape: (1,)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,443][97397] ConvEncoder: input_channels=3\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,582][97397] Conv encoder output size: 512\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,585][97397] Policy head output size: 640\u001b[0m\n", + "\u001b[33m[2023-09-14 12:03:17,532][97397] Loading state from checkpoint /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000246_1007616.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:17,565][97397] Port 40300 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:17,567][97397] Using port 40300\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:03:17,568][97397] Initializing env for player 0, init_info: {'port': 40300}...\u001b[0m\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "\u001b[37m\u001b[1m[2023-09-14 12:03:17,618][97397] Initializing env for player 1, init_info: {'port': 40300}...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:17,668][97397] 2 agent workers initialized for env 0!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:03:17,670][97397] Using port 40300 on host...\u001b[0m\n", + "Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Contacting host: /Press 'Q' to abort network game synchronization.\n", + "Network game synchronization timeout: 4s.\n", + "Got connect from node 1. \n", + "Waiting for players: .. [ 2/ 2]\n", + "Sending all here. \n", + "\n", + "Total players: 2 \n", + "\n", + "Waiting for other players: .. [ 2/ 2]\n", + "Console player number: 1 \n", + "Received All Here, sending ACK. \n", + "\n", + "Go \n", + "Total players: 2 \n", + "\n", + "Console player number: 1 \n", + "Received All Here, sending ACK. \n", + "Received \"Go.\" \n", + "\n", + "Total players: 2 \n", + "\n", + "Found AI0_host (node 1, player 1) \n", + "Found AI1 (node 1, player 2) \n", + "Found AI1 (node 0, player 2) \n", + "\n", + "\n", + "\u001b[37m\u001b[1m[2023-09-14 12:03:18,724][97397] Initialized w:0 v:0 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:03:18,725][97397] Initialized w:0 v:0 player:1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:19,234][97397] Num frames 100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:19,470][97397] Num frames 200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:19,714][97397] Num frames 300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:19,959][97397] Num frames 400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:20,180][97397] Num frames 500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:20,428][97397] Num frames 600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:20,660][97397] Num frames 700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:20,937][97397] Num frames 800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:21,231][97397] Num frames 900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:21,512][97397] Num frames 1000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:21,784][97397] Num frames 1100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:22,030][97397] Num frames 1200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:22,268][97397] Num frames 1300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:22,512][97397] Num frames 1400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:22,757][97397] Num frames 1500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:22,995][97397] Num frames 1600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:23,221][97397] Num frames 1700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:23,437][97397] Num frames 1800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:23,659][97397] Num frames 1900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:23,896][97397] Num frames 2000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:24,135][97397] Num frames 2100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:24,426][97397] Num frames 2200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:24,679][97397] Num frames 2300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:24,943][97397] Num frames 2400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:25,201][97397] Num frames 2500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:25,501][97397] Num frames 2600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:25,739][97397] Num frames 2700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:25,997][97397] Num frames 2800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:26,227][97397] Num frames 2900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:26,464][97397] Num frames 3000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:26,699][97397] Num frames 3100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:26,942][97397] Num frames 3200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:27,198][97397] Num frames 3300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:27,465][97397] Num frames 3400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:27,710][97397] Num frames 3500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:27,951][97397] Num frames 3600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:28,225][97397] Num frames 3700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:28,516][97397] Num frames 3800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:28,765][97397] Num frames 3900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:29,034][97397] Num frames 4000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:29,303][97397] Num frames 4100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:29,566][97397] Num frames 4200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:29,808][97397] Num frames 4300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:30,057][97397] Num frames 4400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:30,295][97397] Num frames 4500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:30,535][97397] Num frames 4600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:30,782][97397] Num frames 4700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:31,013][97397] Num frames 4800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:31,286][97397] Num frames 4900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:31,539][97397] Num frames 5000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:31,791][97397] Num frames 5100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:32,037][97397] Num frames 5200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:32,298][97397] Num frames 5300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:32,537][97397] Num frames 5400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:32,805][97397] Num frames 5500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:33,061][97397] Num frames 5600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:33,340][97397] Num frames 5700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:33,586][97397] Num frames 5800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:33,817][97397] Num frames 5900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:34,076][97397] Num frames 6000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:34,392][97397] Num frames 6100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:34,637][97397] Num frames 6200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:34,906][97397] Num frames 6300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:35,135][97397] Num frames 6400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:35,393][97397] Num frames 6500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:35,640][97397] Num frames 6600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:35,896][97397] Num frames 6700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:36,136][97397] Num frames 6800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:36,355][97397] Num frames 6900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:36,596][97397] Num frames 7000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:36,863][97397] Num frames 7100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:37,149][97397] Num frames 7200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:37,424][97397] Num frames 7300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:37,691][97397] Num frames 7400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:37,951][97397] Num frames 7500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:38,265][97397] Num frames 7600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:38,525][97397] Num frames 7700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:38,763][97397] Num frames 7800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:38,998][97397] Num frames 7900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:39,260][97397] Num frames 8000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:39,544][97397] Num frames 8100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:39,816][97397] Num frames 8200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:40,090][97397] Num frames 8300...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:03:40,347][97397] DAMAGECOUNT value on done: 0.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:03:40,347][97397] DAMAGECOUNT value on done: 12.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:03:40,349][97397] Sum rewards: 14.318, reward structure: {'HEALTH': '-1.120', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.003', 'AMMO2': '0.014', 'AMMO3': '0.040', 'AMMO4': '0.069', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.400', 'weapon5': '0.574', 'weapon4': '0.602', 'weapon2': '1.536', 'weapon3': '13.002'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:03:40,416][97397] Avg episode rewards: #0: 10.216, #1: 14.318, true rewards: #0: 1.000, #1: 0.000\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:03:40,418][97397] Avg episode reward: 12.267, avg true_objective: 0.500\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:40,425][97397] Num frames 8400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:40,697][97397] Num frames 8500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:40,965][97397] Num frames 8600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:41,246][97397] Num frames 8700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:41,492][97397] Num frames 8800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:41,750][97397] Num frames 8900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:41,980][97397] Num frames 9000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:42,252][97397] Num frames 9100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:42,507][97397] Num frames 9200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:42,768][97397] Num frames 9300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:43,083][97397] Num frames 9400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:43,342][97397] Num frames 9500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:43,577][97397] Num frames 9600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:43,847][97397] Num frames 9700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:44,132][97397] Num frames 9800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:44,614][97397] Num frames 9900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:44,935][97397] Num frames 10000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:45,280][97397] Num frames 10100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:45,680][97397] Num frames 10200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:45,980][97397] Num frames 10300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:46,271][97397] Num frames 10400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:46,586][97397] Num frames 10500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:47,011][97397] Num frames 10600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:47,368][97397] Num frames 10700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:47,759][97397] Num frames 10800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:48,043][97397] Num frames 10900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:48,392][97397] Num frames 11000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:48,754][97397] Num frames 11100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:49,028][97397] Num frames 11200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:49,362][97397] Num frames 11300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:49,662][97397] Num frames 11400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:49,936][97397] Num frames 11500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:50,173][97397] Num frames 11600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:50,426][97397] Num frames 11700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:50,689][97397] Num frames 11800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:51,025][97397] Num frames 11900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:51,312][97397] Num frames 12000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:51,569][97397] Num frames 12100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:51,833][97397] Num frames 12200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:52,066][97397] Num frames 12300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:52,306][97397] Num frames 12400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:52,541][97397] Num frames 12500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:52,842][97397] Num frames 12600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:53,109][97397] Num frames 12700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:53,358][97397] Num frames 12800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:53,661][97397] Num frames 12900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:53,950][97397] Num frames 13000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:54,218][97397] Num frames 13100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:54,507][97397] Num frames 13200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:54,814][97397] Num frames 13300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:55,075][97397] Num frames 13400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:55,346][97397] Num frames 13500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:55,638][97397] Num frames 13600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:55,960][97397] Num frames 13700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:56,267][97397] Num frames 13800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:56,540][97397] Num frames 13900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:56,852][97397] Num frames 14000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:57,123][97397] Num frames 14100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:57,382][97397] Num frames 14200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:57,680][97397] Num frames 14300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:57,960][97397] Num frames 14400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:58,234][97397] Num frames 14500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:58,529][97397] Num frames 14600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:58,825][97397] Num frames 14700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:59,128][97397] Num frames 14800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:59,445][97397] Num frames 14900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:59,717][97397] Num frames 15000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:59,982][97397] Num frames 15100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:00,232][97397] Num frames 15200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:00,507][97397] Num frames 15300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:00,764][97397] Num frames 15400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:01,001][97397] Num frames 15500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:01,293][97397] Num frames 15600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:01,557][97397] Num frames 15700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:01,944][97397] Num frames 15800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:02,232][97397] Num frames 15900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:02,472][97397] Num frames 16000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:02,712][97397] Num frames 16100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:02,938][97397] Num frames 16200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:03,185][97397] Num frames 16300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:03,427][97397] Num frames 16400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:03,697][97397] Num frames 16500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:03,945][97397] Num frames 16600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:04,170][97397] Num frames 16700...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:04,458][97397] DAMAGECOUNT value on done: 45.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:04,458][97397] DAMAGECOUNT value on done: 37.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:04,460][97397] Sum rewards: 14.910, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.025', 'AMMO3': '0.040', 'AMMO4': '0.123', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.450', 'weapon5': '0.666', 'weapon2': '0.872', 'weapon4': '1.078', 'weapon3': '12.950'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:04,523][97397] Avg episode rewards: #0: 11.004, #1: 14.613, true rewards: #0: 1.000, #1: 0.000\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:04,524][97397] Avg episode reward: 12.809, avg true_objective: 0.500\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:04,537][97397] Num frames 16800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:04,881][97397] Num frames 16900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:05,221][97397] Num frames 17000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:05,516][97397] Num frames 17100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:05,777][97397] Num frames 17200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:06,013][97397] Num frames 17300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:06,260][97397] Num frames 17400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:06,504][97397] Num frames 17500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:06,754][97397] Num frames 17600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:07,073][97397] Num frames 17700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:07,350][97397] Num frames 17800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:07,602][97397] Num frames 17900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:07,903][97397] Num frames 18000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:08,237][97397] Num frames 18100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:08,546][97397] Num frames 18200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:08,776][97397] Num frames 18300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:09,022][97397] Num frames 18400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:09,275][97397] Num frames 18500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:09,543][97397] Num frames 18600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:09,797][97397] Num frames 18700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:10,062][97397] Num frames 18800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:10,307][97397] Num frames 18900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:10,568][97397] Num frames 19000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:10,864][97397] Num frames 19100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:11,098][97397] Num frames 19200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:11,396][97397] Num frames 19300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:11,632][97397] Num frames 19400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:11,889][97397] Num frames 19500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:12,112][97397] Num frames 19600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:12,361][97397] Num frames 19700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:12,616][97397] Num frames 19800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:12,868][97397] Num frames 19900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:13,164][97397] Num frames 20000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:13,401][97397] Num frames 20100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:13,650][97397] Num frames 20200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:13,878][97397] Num frames 20300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:14,130][97397] Num frames 20400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:14,401][97397] Num frames 20500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:14,646][97397] Num frames 20600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:14,916][97397] Num frames 20700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:15,199][97397] Num frames 20800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:15,466][97397] Num frames 20900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:15,720][97397] Num frames 21000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:15,953][97397] Num frames 21100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:16,210][97397] Num frames 21200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:16,473][97397] Num frames 21300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:16,712][97397] Num frames 21400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:16,936][97397] Num frames 21500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:17,181][97397] Num frames 21600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:17,431][97397] Num frames 21700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:17,711][97397] Num frames 21800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:17,973][97397] Num frames 21900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:18,290][97397] Num frames 22000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:18,536][97397] Num frames 22100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:18,792][97397] Num frames 22200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:19,032][97397] Num frames 22300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:19,304][97397] Num frames 22400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:19,551][97397] Num frames 22500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:19,780][97397] Num frames 22600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:20,016][97397] Num frames 22700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:20,259][97397] Num frames 22800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:20,493][97397] Num frames 22900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:20,774][97397] Num frames 23000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:21,015][97397] Num frames 23100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:21,284][97397] Num frames 23200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:21,520][97397] Num frames 23300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:21,777][97397] Num frames 23400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:22,013][97397] Num frames 23500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:22,246][97397] Num frames 23600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:22,481][97397] Num frames 23700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:22,716][97397] Num frames 23800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:22,938][97397] Num frames 23900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:23,165][97397] Num frames 24000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:23,417][97397] Num frames 24100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:23,651][97397] Num frames 24200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:23,888][97397] Num frames 24300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:24,136][97397] Num frames 24400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:24,426][97397] Num frames 24500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:24,698][97397] Num frames 24600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:24,977][97397] Num frames 24700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:25,257][97397] Num frames 24800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:25,561][97397] Num frames 24900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:25,820][97397] Num frames 25000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:26,061][97397] Num frames 25100...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:26,287][97397] DAMAGECOUNT value on done: 57.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:26,287][97397] DAMAGECOUNT value on done: 92.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:26,289][97397] Sum rewards: 9.675, reward structure: {'HEALTH': '-1.470', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon5': '0.194', 'WEAPON3': '0.200', 'DAMAGECOUNT': '0.200', 'FRAGCOUNT': '0.999', 'weapon4': '1.842', 'weapon3': '3.908', 'weapon2': '4.548'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:26,349][97397] Avg episode rewards: #0: 10.561, #1: 14.175, true rewards: #0: 0.667, #1: 0.000\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:26,350][97397] Avg episode reward: 12.368, avg true_objective: 0.333\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:26,366][97397] Num frames 25200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:26,632][97397] Num frames 25300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:26,901][97397] Num frames 25400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:27,185][97397] Num frames 25500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:27,438][97397] Num frames 25600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:27,679][97397] Num frames 25700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:27,927][97397] Num frames 25800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:28,205][97397] Num frames 25900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:28,498][97397] Num frames 26000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:28,782][97397] Num frames 26100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:29,072][97397] Num frames 26200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:29,342][97397] Num frames 26300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:29,583][97397] Num frames 26400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:29,847][97397] Num frames 26500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:30,142][97397] Num frames 26600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:30,414][97397] Num frames 26700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:30,661][97397] Num frames 26800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:30,920][97397] Num frames 26900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:31,202][97397] Num frames 27000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:31,434][97397] Num frames 27100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:31,674][97397] Num frames 27200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:31,932][97397] Num frames 27300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:32,167][97397] Num frames 27400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:32,386][97397] Num frames 27500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:32,608][97397] Num frames 27600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:32,825][97397] Num frames 27700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:33,072][97397] Num frames 27800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:33,312][97397] Num frames 27900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:33,547][97397] Num frames 28000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:33,792][97397] Num frames 28100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:34,030][97397] Num frames 28200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:34,284][97397] Num frames 28300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:34,553][97397] Num frames 28400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:34,800][97397] Num frames 28500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:35,057][97397] Num frames 28600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:35,314][97397] Num frames 28700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:35,562][97397] Num frames 28800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:35,795][97397] Num frames 28900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:36,036][97397] Num frames 29000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:36,266][97397] Num frames 29100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:36,503][97397] Num frames 29200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:36,746][97397] Num frames 29300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:36,998][97397] Num frames 29400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:37,247][97397] Num frames 29500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:37,505][97397] Num frames 29600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:37,756][97397] Num frames 29700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:38,028][97397] Num frames 29800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:38,291][97397] Num frames 29900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:38,536][97397] Num frames 30000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:38,793][97397] Num frames 30100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:39,048][97397] Num frames 30200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:39,301][97397] Num frames 30300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:39,549][97397] Num frames 30400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:39,782][97397] Num frames 30500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:40,014][97397] Num frames 30600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:40,252][97397] Num frames 30700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:40,496][97397] Num frames 30800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:40,722][97397] Num frames 30900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:40,973][97397] Num frames 31000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:41,282][97397] Num frames 31100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:41,538][97397] Num frames 31200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:41,780][97397] Num frames 31300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:42,016][97397] Num frames 31400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:42,248][97397] Num frames 31500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:42,486][97397] Num frames 31600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:42,725][97397] Num frames 31700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:42,998][97397] Num frames 31800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:43,261][97397] Num frames 31900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:43,498][97397] Num frames 32000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:43,801][97397] Num frames 32100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:44,104][97397] Num frames 32200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:44,403][97397] Num frames 32300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:44,690][97397] Num frames 32400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:44,949][97397] Num frames 32500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:45,237][97397] Num frames 32600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:45,499][97397] Num frames 32700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:45,739][97397] Num frames 32800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:45,990][97397] Num frames 32900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:46,252][97397] Num frames 33000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:46,510][97397] Num frames 33100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:46,742][97397] Num frames 33200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:47,033][97397] Num frames 33300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:47,284][97397] Num frames 33400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:47,556][97397] Num frames 33500...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:47,799][97397] DAMAGECOUNT value on done: 342.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:47,800][97397] DAMAGECOUNT value on done: 107.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:47,801][97397] Sum rewards: 19.276, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.011', 'AMMO3': '0.040', 'AMMO4': '0.056', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.374', 'WEAPON3': '0.400', 'weapon4': '1.230', 'weapon2': '1.394', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.850', 'weapon3': '12.764'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:47,863][97397] Avg episode rewards: #0: 12.740, #1: 12.316, true rewards: #0: 0.750, #1: 0.000\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:47,865][97397] Avg episode reward: 12.528, avg true_objective: 0.375\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:47,884][97397] Num frames 33600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:48,124][97397] Num frames 33700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:48,385][97397] Num frames 33800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:48,615][97397] Num frames 33900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:48,862][97397] Num frames 34000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:49,148][97397] Num frames 34100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:49,425][97397] Num frames 34200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:49,708][97397] Num frames 34300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:49,987][97397] Num frames 34400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:50,243][97397] Num frames 34500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:50,486][97397] Num frames 34600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:50,725][97397] Num frames 34700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:50,991][97397] Num frames 34800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:51,270][97397] Num frames 34900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:51,520][97397] Num frames 35000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:51,790][97397] Num frames 35100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:52,028][97397] Num frames 35200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:52,275][97397] Num frames 35300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:52,520][97397] Num frames 35400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:52,760][97397] Num frames 35500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:52,998][97397] Num frames 35600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:53,236][97397] Num frames 35700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:53,470][97397] Num frames 35800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:53,703][97397] Num frames 35900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:53,944][97397] Num frames 36000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:54,174][97397] Num frames 36100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:54,436][97397] Num frames 36200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:54,682][97397] Num frames 36300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:54,947][97397] Num frames 36400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:55,210][97397] Num frames 36500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:55,472][97397] Num frames 36600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:55,704][97397] Num frames 36700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:55,952][97397] Num frames 36800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:56,178][97397] Num frames 36900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:56,405][97397] Num frames 37000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:56,635][97397] Num frames 37100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:56,856][97397] Num frames 37200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:57,121][97397] Num frames 37300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:57,391][97397] Num frames 37400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:57,621][97397] Num frames 37500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:57,859][97397] Num frames 37600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:58,130][97397] Num frames 37700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:58,382][97397] Num frames 37800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:58,604][97397] Num frames 37900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:58,870][97397] Num frames 38000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:59,131][97397] Num frames 38100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:59,383][97397] Num frames 38200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:59,626][97397] Num frames 38300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:59,862][97397] Num frames 38400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:00,101][97397] Num frames 38500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:00,343][97397] Num frames 38600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:00,567][97397] Num frames 38700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:00,801][97397] Num frames 38800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:01,050][97397] Num frames 38900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:01,337][97397] Num frames 39000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:01,608][97397] Num frames 39100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:01,865][97397] Num frames 39200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:02,116][97397] Num frames 39300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:02,357][97397] Num frames 39400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:02,605][97397] Num frames 39500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:02,832][97397] Num frames 39600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:03,081][97397] Num frames 39700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:03,342][97397] Num frames 39800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:03,623][97397] Num frames 39900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:03,923][97397] Num frames 40000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:04,190][97397] Num frames 40100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:04,551][97397] Num frames 40200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:04,831][97397] Num frames 40300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:05,082][97397] Num frames 40400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:05,341][97397] Num frames 40500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:05,629][97397] Num frames 40600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:05,874][97397] Num frames 40700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:06,146][97397] Num frames 40800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:06,386][97397] Num frames 40900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:06,633][97397] Num frames 41000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:06,869][97397] Num frames 41100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:07,142][97397] Num frames 41200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:07,416][97397] Num frames 41300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:07,719][97397] Num frames 41400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:07,962][97397] Num frames 41500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:08,222][97397] Num frames 41600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:08,472][97397] Num frames 41700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:08,727][97397] Num frames 41800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:08,963][97397] Num frames 41900...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:05:09,207][97397] DAMAGECOUNT value on done: 442.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:05:09,207][97397] DAMAGECOUNT value on done: 282.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:05:09,208][97397] Sum rewards: 12.061, reward structure: {'HEALTH': '-2.400', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.004', 'AMMO4': '0.020', 'AMMO3': '0.050', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.400', 'weapon5': '0.556', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon4': '1.958', 'weapon2': '2.464', 'weapon3': '8.806'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:05:09,209][97397] Sum rewards: 11.181, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO4': '0.025', 'AMMO3': '0.037', 'WEAPON4': '0.100', 'WEAPON3': '0.300', 'weapon4': '0.702', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.750', 'weapon2': '3.640', 'weapon3': '5.622'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:05:09,273][97397] Avg episode rewards: #0: 12.604, #1: 12.089, true rewards: #0: 0.600, #1: 0.200\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:05:09,275][97397] Avg episode reward: 12.346, avg true_objective: 0.400\u001b[0m\n" ] }, { - "ename": "TypeError", - "evalue": "'NoneType' object is not subscriptable", + "ename": "", + "evalue": "", "output_type": "error", "traceback": [ - "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", - "\u001b[0;31mTypeError\u001b[0m Traceback (most recent call last)", - "Cell \u001b[0;32mIn[5], line 6\u001b[0m\n\u001b[1;32m 1\u001b[0m \u001b[38;5;28;01mfrom\u001b[39;00m \u001b[38;5;21;01msample_factory\u001b[39;00m\u001b[38;5;21;01m.\u001b[39;00m\u001b[38;5;21;01menjoy\u001b[39;00m \u001b[38;5;28;01mimport\u001b[39;00m enjoy\n\u001b[1;32m 3\u001b[0m cfg \u001b[38;5;241m=\u001b[39m parse_vizdoom_cfg(\n\u001b[1;32m 4\u001b[0m argv\u001b[38;5;241m=\u001b[39m[\u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m--env=\u001b[39m\u001b[38;5;132;01m{\u001b[39;00menv\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m\"\u001b[39m, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m--num_workers=1\u001b[39m\u001b[38;5;124m\"\u001b[39m, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m--save_video\u001b[39m\u001b[38;5;124m\"\u001b[39m, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m--no_render\u001b[39m\u001b[38;5;124m\"\u001b[39m, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m--max_num_episodes=10\u001b[39m\u001b[38;5;124m\"\u001b[39m], evaluation\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mTrue\u001b[39;00m\n\u001b[1;32m 5\u001b[0m )\n\u001b[0;32m----> 6\u001b[0m status \u001b[38;5;241m=\u001b[39m \u001b[43menjoy\u001b[49m\u001b[43m(\u001b[49m\u001b[43mcfg\u001b[49m\u001b[43m)\u001b[49m\n", - "File \u001b[0;32m~/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/enjoy.py:125\u001b[0m, in \u001b[0;36menjoy\u001b[0;34m(cfg)\u001b[0m\n\u001b[1;32m 123\u001b[0m checkpoints \u001b[38;5;241m=\u001b[39m Learner\u001b[38;5;241m.\u001b[39mget_checkpoints(Learner\u001b[38;5;241m.\u001b[39mcheckpoint_dir(cfg, policy_id), \u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;132;01m{\u001b[39;00mname_prefix\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m_*\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n\u001b[1;32m 124\u001b[0m checkpoint_dict \u001b[38;5;241m=\u001b[39m Learner\u001b[38;5;241m.\u001b[39mload_checkpoint(checkpoints, device)\n\u001b[0;32m--> 125\u001b[0m actor_critic\u001b[38;5;241m.\u001b[39mload_state_dict(\u001b[43mcheckpoint_dict\u001b[49m\u001b[43m[\u001b[49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[38;5;124;43mmodel\u001b[39;49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[43m]\u001b[49m)\n\u001b[1;32m 127\u001b[0m episode_rewards \u001b[38;5;241m=\u001b[39m [deque([], maxlen\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m100\u001b[39m) \u001b[38;5;28;01mfor\u001b[39;00m _ \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28mrange\u001b[39m(env\u001b[38;5;241m.\u001b[39mnum_agents)]\n\u001b[1;32m 128\u001b[0m true_objectives \u001b[38;5;241m=\u001b[39m [deque([], maxlen\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m100\u001b[39m) \u001b[38;5;28;01mfor\u001b[39;00m _ \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28mrange\u001b[39m(env\u001b[38;5;241m.\u001b[39mnum_agents)]\n", - "\u001b[0;31mTypeError\u001b[0m: 'NoneType' object is not subscriptable" + "\u001b[1;31mThe Kernel crashed while executing code in the the current cell or a previous cell. Please review the code in the cell(s) to identify a possible cause of the failure. Click here for more info. View Jupyter log for further details." ] } ], @@ -7106,9 +2874,24 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 1, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "8e0e4af164c84f76a7d7ed1ec726fc6b", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "VBox(children=(HTML(value='
#0:0 (mpeg4 (native) -> h264 (libx264))\n", + "Press [q] to stop, [?] for help\n", + "[libx264 @ 0x5626da87f0c0] using SAR=1/1\n", + "[libx264 @ 0x5626da87f0c0] using cpu capabilities: MMX2 SSE2Fast SSSE3 SSE4.2 AVX FMA3 BMI2 AVX2 AVX512\n", + "[libx264 @ 0x5626da87f0c0] profile High, level 2.1\n", + "[libx264 @ 0x5626da87f0c0] 264 - core 155 r2917 0a84d98 - H.264/MPEG-4 AVC codec - Copyleft 2003-2018 - http://www.videolan.org/x264.html - options: cabac=1 ref=3 deblock=1:0:0 analyse=0x3:0x113 me=hex subme=7 psy=1 psy_rd=1.00:0.00 mixed_ref=1 me_range=16 chroma_me=1 trellis=1 8x8dct=1 cqm=0 deadzone=21,11 fast_pskip=1 chroma_qp_offset=-2 threads=6 lookahead_threads=1 sliced_threads=0 nr=0 decimate=1 interlaced=0 bluray_compat=0 constrained_intra=0 bframes=3 b_pyramid=2 b_adapt=1 b_bias=0 direct=1 weightb=1 open_gop=0 weightp=2 keyint=250 keyint_min=25 scenecut=40 intra_refresh=0 rc_lookahead=40 rc=crf mbtree=1 crf=23.0 qcomp=0.60 qpmin=0 qpmax=69 qpstep=4 ip_ratio=1.40 aq=1:1.00\n", + "Output #0, mp4, to '/home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/replay.mp4':\n", + " Metadata:\n", + " major_brand : isom\n", + " minor_version : 512\n", + " compatible_brands: isomiso2mp41\n", + " encoder : Lavf58.29.100\n", + " Stream #0:0(und): Video: h264 (libx264) (avc1 / 0x31637661), yuv420p, 640x180 [SAR 1:1 DAR 32:9], q=-1--1, 35 fps, 17920 tbn, 35 tbc (default)\n", + " Metadata:\n", + " handler_name : VideoHandler\n", + " encoder : Lavc58.54.100 libx264\n", + " Side data:\n", + " cpb: bitrate max/min/avg: 0/0/0 buffer size: 0 vbv_delay: -1\n", + "frame=42000 fps=222 q=-1.0 Lsize= 222449kB time=00:19:59.91 bitrate=1518.7kbits/s speed=6.35x \n", + "video:221954kB audio:0kB subtitle:0kB other streams:0kB global headers:0kB muxing overhead: 0.222909%\n", + "[libx264 @ 0x5626da87f0c0] frame I:188 Avg QP:24.95 size: 18260\n", + "[libx264 @ 0x5626da87f0c0] frame P:10663 Avg QP:28.28 size: 6691\n", + "[libx264 @ 0x5626da87f0c0] frame B:31149 Avg QP:30.26 size: 4896\n", + "[libx264 @ 0x5626da87f0c0] consecutive B-frames: 0.9% 0.3% 1.0% 97.8%\n", + "[libx264 @ 0x5626da87f0c0] mb I I16..4: 0.5% 68.5% 31.0%\n", + "[libx264 @ 0x5626da87f0c0] mb P I16..4: 0.7% 34.8% 7.6% P16..4: 20.3% 14.7% 5.3% 0.0% 0.0% skip:16.6%\n", + "[libx264 @ 0x5626da87f0c0] mb B I16..4: 0.3% 11.5% 2.0% B16..8: 31.8% 19.1% 5.6% direct: 7.8% skip:21.9% L0:49.4% L1:41.6% BI: 9.0%\n", + "[libx264 @ 0x5626da87f0c0] 8x8 transform intra:81.7% inter:65.2%\n", + "[libx264 @ 0x5626da87f0c0] coded y,uvDC,uvAC intra: 93.5% 59.2% 24.3% inter: 51.7% 20.9% 2.0%\n", + "[libx264 @ 0x5626da87f0c0] i16 v,h,dc,p: 36% 42% 9% 12%\n", + "[libx264 @ 0x5626da87f0c0] i8 v,h,dc,ddl,ddr,vr,hd,vl,hu: 12% 20% 29% 6% 6% 5% 7% 6% 10%\n", + "[libx264 @ 0x5626da87f0c0] i4 v,h,dc,ddl,ddr,vr,hd,vl,hu: 21% 27% 17% 6% 7% 5% 6% 4% 7%\n", + "[libx264 @ 0x5626da87f0c0] i8c dc,h,v,p: 60% 22% 15% 3%\n", + "[libx264 @ 0x5626da87f0c0] Weighted P-Frames: Y:0.0% UV:0.0%\n", + "[libx264 @ 0x5626da87f0c0] ref P L0: 42.0% 12.5% 26.4% 19.1%\n", + "[libx264 @ 0x5626da87f0c0] ref B L0: 79.5% 15.0% 5.5%\n", + "[libx264 @ 0x5626da87f0c0] ref B L1: 92.0% 8.0%\n", + "[libx264 @ 0x5626da87f0c0] kb/s:1515.20\n", + "\u001b[36m[2023-09-14 12:13:05,845][109198] Replay video saved to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/replay.mp4!\u001b[0m\n" ] }, { - "ename": "TypeError", - "evalue": "'NoneType' object is not subscriptable", - "output_type": "error", - "traceback": [ - "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", - "\u001b[0;31mTypeError\u001b[0m Traceback (most recent call last)", - "Cell \u001b[0;32mIn[8], line 18\u001b[0m\n\u001b[1;32m 3\u001b[0m hf_username \u001b[38;5;241m=\u001b[39m \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mMattStammers\u001b[39m\u001b[38;5;124m\"\u001b[39m \u001b[38;5;66;03m# insert your HuggingFace username here\u001b[39;00m\n\u001b[1;32m 5\u001b[0m cfg \u001b[38;5;241m=\u001b[39m parse_vizdoom_cfg(\n\u001b[1;32m 6\u001b[0m argv\u001b[38;5;241m=\u001b[39m[\n\u001b[1;32m 7\u001b[0m \u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m--env=\u001b[39m\u001b[38;5;132;01m{\u001b[39;00menv\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m\"\u001b[39m,\n\u001b[0;32m (...)\u001b[0m\n\u001b[1;32m 16\u001b[0m evaluation\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mTrue\u001b[39;00m,\n\u001b[1;32m 17\u001b[0m )\n\u001b[0;32m---> 18\u001b[0m status \u001b[38;5;241m=\u001b[39m \u001b[43menjoy\u001b[49m\u001b[43m(\u001b[49m\u001b[43mcfg\u001b[49m\u001b[43m)\u001b[49m\n", - "File \u001b[0;32m~/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/enjoy.py:125\u001b[0m, in \u001b[0;36menjoy\u001b[0;34m(cfg)\u001b[0m\n\u001b[1;32m 123\u001b[0m checkpoints \u001b[38;5;241m=\u001b[39m Learner\u001b[38;5;241m.\u001b[39mget_checkpoints(Learner\u001b[38;5;241m.\u001b[39mcheckpoint_dir(cfg, policy_id), \u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;132;01m{\u001b[39;00mname_prefix\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m_*\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n\u001b[1;32m 124\u001b[0m checkpoint_dict \u001b[38;5;241m=\u001b[39m Learner\u001b[38;5;241m.\u001b[39mload_checkpoint(checkpoints, device)\n\u001b[0;32m--> 125\u001b[0m actor_critic\u001b[38;5;241m.\u001b[39mload_state_dict(\u001b[43mcheckpoint_dict\u001b[49m\u001b[43m[\u001b[49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[38;5;124;43mmodel\u001b[39;49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[43m]\u001b[49m)\n\u001b[1;32m 127\u001b[0m episode_rewards \u001b[38;5;241m=\u001b[39m [deque([], maxlen\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m100\u001b[39m) \u001b[38;5;28;01mfor\u001b[39;00m _ \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28mrange\u001b[39m(env\u001b[38;5;241m.\u001b[39mnum_agents)]\n\u001b[1;32m 128\u001b[0m true_objectives \u001b[38;5;241m=\u001b[39m [deque([], maxlen\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m100\u001b[39m) \u001b[38;5;28;01mfor\u001b[39;00m _ \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28mrange\u001b[39m(env\u001b[38;5;241m.\u001b[39mnum_agents)]\n", - "\u001b[0;31mTypeError\u001b[0m: 'NoneType' object is not subscriptable" - ] + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "7d9510d5704c43da8efc6ee2be949f0a", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "events.out.tfevents.1694539452.rhmmedcatt-ProLiant-ML350-Gen10: 0%| | 0.00/92.3k [00:00 --algo=APPO --env=doom_health_gathering_supreme --train_dir=./train_dir --experiment=rl_course_vizdoom_health_gathering_supreme --``` -- -- --You can also upload models to the Hugging Face Hub using the same script with the `--push_to_hub` flag. --See https://www.samplefactory.dev/10-huggingface/huggingface/ for more details -- --## Training with this model -- --To continue training with this model, use the `train` script corresponding to this environment: --``` --python -m --algo=APPO --env=doom_health_gathering_supreme --train_dir=./train_dir --experiment=rl_course_vizdoom_health_gathering_supreme --restart_behavior=resume --train_for_env_steps=10000000000 --``` -- --Note, you may have to adjust `--train_for_env_steps` to a su \ No newline at end of file diff --git a/environments/sample_factory/train_dir/default_experiment/sf_log.txt b/environments/sample_factory/train_dir/default_experiment/sf_log.txt index 4a0823e..ce66ef1 100644 --- a/environments/sample_factory/train_dir/default_experiment/sf_log.txt +++ b/environments/sample_factory/train_dir/default_experiment/sf_log.txt @@ -6141,3 +6141,12701 @@ main_loop: 1780.8502 [2023-09-12 21:31:31,121][39698] Loop rollout_proc3_evt_loop terminating... [2023-09-12 21:31:31,150][39696] Stopping RolloutWorker_w2... [2023-09-12 21:31:31,151][39696] Loop rollout_proc2_evt_loop terminating... +[2023-09-14 11:22:10,759][97397] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json... +[2023-09-14 11:22:10,907][97397] Rollout worker 0 uses device cpu +[2023-09-14 11:22:10,908][97397] Rollout worker 1 uses device cpu +[2023-09-14 11:22:10,910][97397] Rollout worker 2 uses device cpu +[2023-09-14 11:22:10,912][97397] Rollout worker 3 uses device cpu +[2023-09-14 11:22:10,913][97397] Rollout worker 4 uses device cpu +[2023-09-14 11:22:10,914][97397] Rollout worker 5 uses device cpu +[2023-09-14 11:22:10,916][97397] Rollout worker 6 uses device cpu +[2023-09-14 11:22:10,917][97397] Rollout worker 7 uses device cpu +[2023-09-14 11:22:11,107][97397] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 11:22:11,108][97397] InferenceWorker_p0-w0: min num requests: 2 +[2023-09-14 11:22:11,134][97397] Starting all processes... +[2023-09-14 11:22:11,135][97397] Starting process learner_proc0 +[2023-09-14 11:22:12,719][97397] Starting all processes... +[2023-09-14 11:22:12,721][98257] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 11:22:12,721][98257] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 +[2023-09-14 11:22:12,726][97397] Starting process inference_proc0-0 +[2023-09-14 11:22:12,727][97397] Starting process rollout_proc0 +[2023-09-14 11:22:12,727][97397] Starting process rollout_proc1 +[2023-09-14 11:22:12,739][98257] Num visible devices: 1 +[2023-09-14 11:22:12,727][97397] Starting process rollout_proc2 +[2023-09-14 11:22:12,763][98257] Starting seed is not provided +[2023-09-14 11:22:12,764][98257] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 11:22:12,728][97397] Starting process rollout_proc3 +[2023-09-14 11:22:12,764][98257] Initializing actor-critic model on device cuda:0 +[2023-09-14 11:22:12,764][98257] RunningMeanStd input shape: (23,) +[2023-09-14 11:22:12,765][98257] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 11:22:12,729][97397] Starting process rollout_proc4 +[2023-09-14 11:22:12,765][98257] RunningMeanStd input shape: (1,) +[2023-09-14 11:22:12,729][97397] Starting process rollout_proc5 +[2023-09-14 11:22:12,730][97397] Starting process rollout_proc6 +[2023-09-14 11:22:12,731][97397] Starting process rollout_proc7 +[2023-09-14 11:22:12,777][98257] ConvEncoder: input_channels=3 +[2023-09-14 11:22:12,983][98257] Conv encoder output size: 512 +[2023-09-14 11:22:12,984][98257] Policy head output size: 640 +[2023-09-14 11:22:13,002][98257] Created Actor Critic model with architecture: +[2023-09-14 11:22:13,002][98257] ActorCriticSharedWeights( + (obs_normalizer): ObservationNormalizer( + (running_mean_std): RunningMeanStdDictInPlace( + (running_mean_std): ModuleDict( + (measurements): RunningMeanStdInPlace() + (obs): RunningMeanStdInPlace() + ) + ) + ) + (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) + (encoder): VizdoomEncoder( + (basic_encoder): ConvEncoder( + (enc): RecursiveScriptModule( + original_name=ConvEncoderImpl + (conv_head): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Conv2d) + (1): RecursiveScriptModule(original_name=ELU) + (2): RecursiveScriptModule(original_name=Conv2d) + (3): RecursiveScriptModule(original_name=ELU) + (4): RecursiveScriptModule(original_name=Conv2d) + (5): RecursiveScriptModule(original_name=ELU) + ) + (mlp_layers): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Linear) + (1): RecursiveScriptModule(original_name=ELU) + ) + ) + ) + (measurements_head): Sequential( + (0): Linear(in_features=23, out_features=128, bias=True) + (1): ELU(alpha=1.0) + (2): Linear(in_features=128, out_features=128, bias=True) + (3): ELU(alpha=1.0) + ) + ) + (core): ModelCoreRNN( + (core): GRU(640, 512) + ) + (decoder): MlpDecoder( + (mlp): Identity() + ) + (critic_linear): Linear(in_features=512, out_features=1, bias=True) + (action_parameterization): ActionParameterizationDefault( + (distribution_linear): Linear(in_features=512, out_features=15, bias=True) + ) +) +[2023-09-14 11:22:14,067][98257] Using optimizer +[2023-09-14 11:22:14,068][98257] No checkpoints found +[2023-09-14 11:22:14,068][98257] Did not load from checkpoint, starting from scratch! +[2023-09-14 11:22:14,068][98257] Initialized policy 0 weights for model version 0 +[2023-09-14 11:22:14,070][98257] LearnerWorker_p0 finished initialization! +[2023-09-14 11:22:14,070][98257] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 11:22:14,564][98391] Worker 1 uses CPU cores [4, 5, 6, 7] +[2023-09-14 11:22:14,571][98395] Worker 2 uses CPU cores [8, 9, 10, 11] +[2023-09-14 11:22:14,572][98394] Worker 3 uses CPU cores [12, 13, 14, 15] +[2023-09-14 11:22:14,595][98397] Worker 5 uses CPU cores [20, 21, 22, 23] +[2023-09-14 11:22:14,607][98398] Worker 7 uses CPU cores [28, 29, 30, 31] +[2023-09-14 11:22:14,630][98396] Worker 4 uses CPU cores [16, 17, 18, 19] +[2023-09-14 11:22:14,798][98399] Worker 6 uses CPU cores [24, 25, 26, 27] +[2023-09-14 11:22:14,827][98390] Worker 0 uses CPU cores [0, 1, 2, 3] +[2023-09-14 11:22:14,843][98392] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 11:22:14,843][98392] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 +[2023-09-14 11:22:14,861][98392] Num visible devices: 1 +[2023-09-14 11:22:15,459][98392] RunningMeanStd input shape: (23,) +[2023-09-14 11:22:15,460][98392] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 11:22:15,460][98392] RunningMeanStd input shape: (1,) +[2023-09-14 11:22:15,472][98392] ConvEncoder: input_channels=3 +[2023-09-14 11:22:15,582][98392] Conv encoder output size: 512 +[2023-09-14 11:22:15,583][98392] Policy head output size: 640 +[2023-09-14 11:22:15,867][97397] Inference worker 0-0 is ready! +[2023-09-14 11:22:15,869][97397] All inference workers are ready! Signal rollout workers to start! +[2023-09-14 11:22:15,872][98397] Multi agent env, num agents: 8 +[2023-09-14 11:22:15,873][98399] Multi agent env, num agents: 8 +[2023-09-14 11:22:15,874][98391] Multi agent env, num agents: 8 +[2023-09-14 11:22:15,874][98395] Multi agent env, num agents: 8 +[2023-09-14 11:22:15,875][98394] Multi agent env, num agents: 8 +[2023-09-14 11:22:15,875][98398] Multi agent env, num agents: 8 +[2023-09-14 11:22:15,875][98396] Multi agent env, num agents: 8 +[2023-09-14 11:22:15,875][98390] Multi agent env, num agents: 8 +[2023-09-14 11:22:15,902][98397] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:22:15,904][98399] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:22:15,905][98397] Multi agent env, num agents: 8 +[2023-09-14 11:22:15,907][98399] Multi agent env, num agents: 8 +[2023-09-14 11:22:15,908][98395] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:22:15,908][98396] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:22:15,909][98398] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:22:15,909][98390] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:22:15,909][98391] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:22:15,910][98394] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:22:15,911][98395] Multi agent env, num agents: 8 +[2023-09-14 11:22:15,912][98396] Multi agent env, num agents: 8 +[2023-09-14 11:22:15,912][98398] Multi agent env, num agents: 8 +[2023-09-14 11:22:15,912][98390] Multi agent env, num agents: 8 +[2023-09-14 11:22:15,913][98394] Multi agent env, num agents: 8 +[2023-09-14 11:22:15,917][98391] Multi agent env, num agents: 8 +[2023-09-14 11:22:15,936][98397] Port 40800 is available +[2023-09-14 11:22:15,936][98397] Using port 40800 +[2023-09-14 11:22:15,938][98397] Initializing env for player 0, init_info: {'port': 40800}... +[2023-09-14 11:22:15,938][98399] Port 40900 is available +[2023-09-14 11:22:15,938][98399] Using port 40900 +[2023-09-14 11:22:15,940][98399] Initializing env for player 0, init_info: {'port': 40900}... +[2023-09-14 11:22:15,942][98395] Port 40500 is available +[2023-09-14 11:22:15,942][98395] Using port 40500 +[2023-09-14 11:22:15,943][98395] Initializing env for player 0, init_info: {'port': 40500}... +[2023-09-14 11:22:15,943][98396] Port 40700 is available +[2023-09-14 11:22:15,944][98396] Using port 40700 +[2023-09-14 11:22:15,944][98398] Port 41000 is available +[2023-09-14 11:22:15,944][98390] Port 40300 is available +[2023-09-14 11:22:15,944][98398] Using port 41000 +[2023-09-14 11:22:15,944][98390] Using port 40300 +[2023-09-14 11:22:15,944][98396] Initializing env for player 0, init_info: {'port': 40700}... +[2023-09-14 11:22:15,945][98390] Initializing env for player 0, init_info: {'port': 40300}... +[2023-09-14 11:22:15,945][98394] Port 40600 is available +[2023-09-14 11:22:15,946][98394] Using port 40600 +[2023-09-14 11:22:15,946][98394] Initializing env for player 0, init_info: {'port': 40600}... +[2023-09-14 11:22:15,949][98391] Port 40400 is available +[2023-09-14 11:22:15,949][98391] Using port 40400 +[2023-09-14 11:22:15,950][98391] Initializing env for player 0, init_info: {'port': 40400}... +[2023-09-14 11:22:15,966][98397] Using port 40800 on host... +[2023-09-14 11:22:15,972][98395] Using port 40500 on host... +[2023-09-14 11:22:15,973][98390] Using port 40300 on host... +[2023-09-14 11:22:15,974][98399] Using port 40900 on host... +[2023-09-14 11:22:15,975][98394] Using port 40600 on host... +[2023-09-14 11:22:15,979][98396] Using port 40700 on host... +[2023-09-14 11:22:15,984][98391] Using port 40400 on host... +[2023-09-14 11:22:15,988][98397] Initializing env for player 1, init_info: {'port': 40800}... +[2023-09-14 11:22:15,990][98399] Initializing env for player 1, init_info: {'port': 40900}... +[2023-09-14 11:22:15,993][98395] Initializing env for player 1, init_info: {'port': 40500}... +[2023-09-14 11:22:15,995][98396] Initializing env for player 1, init_info: {'port': 40700}... +[2023-09-14 11:22:15,995][98390] Initializing env for player 1, init_info: {'port': 40300}... +[2023-09-14 11:22:15,997][98394] Initializing env for player 1, init_info: {'port': 40600}... +[2023-09-14 11:22:16,000][98391] Initializing env for player 1, init_info: {'port': 40400}... +[2023-09-14 11:22:16,041][98399] Initializing env for player 2, init_info: {'port': 40900}... +[2023-09-14 11:22:16,042][98397] Initializing env for player 2, init_info: {'port': 40800}... +[2023-09-14 11:22:16,048][98394] Initializing env for player 2, init_info: {'port': 40600}... +[2023-09-14 11:22:16,048][98395] Initializing env for player 2, init_info: {'port': 40500}... +[2023-09-14 11:22:16,046][98390] Initializing env for player 2, init_info: {'port': 40300}... +[2023-09-14 11:22:16,051][98391] Initializing env for player 2, init_info: {'port': 40400}... +[2023-09-14 11:22:16,046][98396] Initializing env for player 2, init_info: {'port': 40700}... +[2023-09-14 11:22:16,097][98390] Initializing env for player 3, init_info: {'port': 40300}... +[2023-09-14 11:22:16,092][98399] Initializing env for player 3, init_info: {'port': 40900}... +[2023-09-14 11:22:16,099][98397] Initializing env for player 3, init_info: {'port': 40800}... +[2023-09-14 11:22:16,099][98394] Initializing env for player 3, init_info: {'port': 40600}... +[2023-09-14 11:22:16,100][98396] Initializing env for player 3, init_info: {'port': 40700}... +[2023-09-14 11:22:16,098][98395] Initializing env for player 3, init_info: {'port': 40500}... +[2023-09-14 11:22:16,106][98391] Initializing env for player 3, init_info: {'port': 40400}... +[2023-09-14 11:22:16,144][98399] Initializing env for player 4, init_info: {'port': 40900}... +[2023-09-14 11:22:16,146][98396] Initializing env for player 4, init_info: {'port': 40700}... +[2023-09-14 11:22:16,151][98397] Initializing env for player 4, init_info: {'port': 40800}... +[2023-09-14 11:22:16,155][98394] Initializing env for player 4, init_info: {'port': 40600}... +[2023-09-14 11:22:16,155][98395] Initializing env for player 4, init_info: {'port': 40500}... +[2023-09-14 11:22:16,162][98390] Initializing env for player 4, init_info: {'port': 40300}... +[2023-09-14 11:22:16,167][98391] Initializing env for player 4, init_info: {'port': 40400}... +[2023-09-14 11:22:16,199][98396] Initializing env for player 5, init_info: {'port': 40700}... +[2023-09-14 11:22:16,203][98399] Initializing env for player 5, init_info: {'port': 40900}... +[2023-09-14 11:22:16,203][98397] Initializing env for player 5, init_info: {'port': 40800}... +[2023-09-14 11:22:16,205][98394] Initializing env for player 5, init_info: {'port': 40600}... +[2023-09-14 11:22:16,207][98395] Initializing env for player 5, init_info: {'port': 40500}... +[2023-09-14 11:22:16,218][98391] Initializing env for player 5, init_info: {'port': 40400}... +[2023-09-14 11:22:16,223][98390] Initializing env for player 5, init_info: {'port': 40300}... +[2023-09-14 11:22:16,251][98399] Initializing env for player 6, init_info: {'port': 40900}... +[2023-09-14 11:22:16,253][98396] Initializing env for player 6, init_info: {'port': 40700}... +[2023-09-14 11:22:16,259][98394] Initializing env for player 6, init_info: {'port': 40600}... +[2023-09-14 11:22:16,263][98397] Initializing env for player 6, init_info: {'port': 40800}... +[2023-09-14 11:22:16,266][98391] Initializing env for player 6, init_info: {'port': 40400}... +[2023-09-14 11:22:16,271][98395] Initializing env for player 6, init_info: {'port': 40500}... +[2023-09-14 11:22:16,289][98390] Initializing env for player 6, init_info: {'port': 40300}... +[2023-09-14 11:22:16,307][98397] Initializing env for player 7, init_info: {'port': 40800}... +[2023-09-14 11:22:16,316][98394] Initializing env for player 7, init_info: {'port': 40600}... +[2023-09-14 11:22:16,316][98396] Initializing env for player 7, init_info: {'port': 40700}... +[2023-09-14 11:22:16,319][98399] Initializing env for player 7, init_info: {'port': 40900}... +[2023-09-14 11:22:16,323][98391] Initializing env for player 7, init_info: {'port': 40400}... +[2023-09-14 11:22:16,331][98395] Initializing env for player 7, init_info: {'port': 40500}... +[2023-09-14 11:22:16,347][98390] Initializing env for player 7, init_info: {'port': 40300}... +[2023-09-14 11:22:17,031][97397] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 0. Throughput: 0: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:22:17,703][98394] Initialized w:3 v:0 player:5 +[2023-09-14 11:22:17,704][98394] Initialized w:3 v:0 player:3 +[2023-09-14 11:22:17,705][98394] Initialized w:3 v:0 player:4 +[2023-09-14 11:22:17,705][98394] Initialized w:3 v:0 player:6 +[2023-09-14 11:22:17,705][98394] Initialized w:3 v:0 player:1 +[2023-09-14 11:22:17,705][98394] Initialized w:3 v:0 player:2 +[2023-09-14 11:22:17,705][98394] Initialized w:3 v:0 player:7 +[2023-09-14 11:22:17,706][98394] Initialized w:3 v:0 player:0 +[2023-09-14 11:22:17,708][98394] 8 agent workers initialized for env 3! +[2023-09-14 11:22:17,753][98394] Decorrelating experience for 0 frames... +[2023-09-14 11:22:17,755][98394] Port 40601 is available +[2023-09-14 11:22:17,755][98394] Using port 40601 +[2023-09-14 11:22:17,755][98394] Initializing env for player 0, init_info: {'port': 40601}... +[2023-09-14 11:22:17,774][98396] Initialized w:4 v:0 player:7 +[2023-09-14 11:22:17,774][98396] Initialized w:4 v:0 player:0 +[2023-09-14 11:22:17,776][98396] Initialized w:4 v:0 player:2 +[2023-09-14 11:22:17,776][98396] Initialized w:4 v:0 player:5 +[2023-09-14 11:22:17,776][98396] Initialized w:4 v:0 player:1 +[2023-09-14 11:22:17,777][98396] Initialized w:4 v:0 player:3 +[2023-09-14 11:22:17,777][98396] Initialized w:4 v:0 player:6 +[2023-09-14 11:22:17,777][98396] Initialized w:4 v:0 player:4 +[2023-09-14 11:22:17,780][98396] 8 agent workers initialized for env 4! +[2023-09-14 11:22:17,787][98394] Using port 40601 on host... +[2023-09-14 11:22:17,806][98394] Initializing env for player 1, init_info: {'port': 40601}... +[2023-09-14 11:22:17,823][98396] Decorrelating experience for 0 frames... +[2023-09-14 11:22:17,825][98396] Port 40701 is available +[2023-09-14 11:22:17,825][98396] Using port 40701 +[2023-09-14 11:22:17,825][98396] Initializing env for player 0, init_info: {'port': 40701}... +[2023-09-14 11:22:17,851][98395] Initialized w:2 v:0 player:5 +[2023-09-14 11:22:17,852][98395] Initialized w:2 v:0 player:4 +[2023-09-14 11:22:17,853][98395] Initialized w:2 v:0 player:2 +[2023-09-14 11:22:17,853][98395] Initialized w:2 v:0 player:0 +[2023-09-14 11:22:17,853][98395] Initialized w:2 v:0 player:1 +[2023-09-14 11:22:17,854][98395] Initialized w:2 v:0 player:6 +[2023-09-14 11:22:17,854][98395] Initialized w:2 v:0 player:3 +[2023-09-14 11:22:17,855][98395] Initialized w:2 v:0 player:7 +[2023-09-14 11:22:17,856][98394] Initializing env for player 2, init_info: {'port': 40601}... +[2023-09-14 11:22:17,857][98395] 8 agent workers initialized for env 2! +[2023-09-14 11:22:17,868][98399] Initialized w:6 v:0 player:5 +[2023-09-14 11:22:17,869][98396] Using port 40701 on host... +[2023-09-14 11:22:17,870][98399] Initialized w:6 v:0 player:0 +[2023-09-14 11:22:17,871][98399] Initialized w:6 v:0 player:6 +[2023-09-14 11:22:17,871][98399] Initialized w:6 v:0 player:2 +[2023-09-14 11:22:17,871][98399] Initialized w:6 v:0 player:7 +[2023-09-14 11:22:17,877][98399] Initialized w:6 v:0 player:3 +[2023-09-14 11:22:17,879][98396] Initializing env for player 1, init_info: {'port': 40701}... +[2023-09-14 11:22:17,879][98399] Initialized w:6 v:0 player:1 +[2023-09-14 11:22:17,894][98395] Decorrelating experience for 0 frames... +[2023-09-14 11:22:17,890][98390] Initialized w:0 v:0 player:6 +[2023-09-14 11:22:17,896][98395] Port 40501 is available +[2023-09-14 11:22:17,895][98390] Initialized w:0 v:0 player:7 +[2023-09-14 11:22:17,896][98395] Using port 40501 +[2023-09-14 11:22:17,895][98390] Initialized w:0 v:0 player:3 +[2023-09-14 11:22:17,895][98390] Initialized w:0 v:0 player:4 +[2023-09-14 11:22:17,897][98395] Initializing env for player 0, init_info: {'port': 40501}... +[2023-09-14 11:22:17,895][98390] Initialized w:0 v:0 player:0 +[2023-09-14 11:22:17,896][98390] Initialized w:0 v:0 player:1 +[2023-09-14 11:22:17,896][98390] Initialized w:0 v:0 player:2 +[2023-09-14 11:22:17,906][98394] Initializing env for player 3, init_info: {'port': 40601}... +[2023-09-14 11:22:17,907][98397] Initialized w:5 v:0 player:2 +[2023-09-14 11:22:17,908][98397] Initialized w:5 v:0 player:3 +[2023-09-14 11:22:17,909][98397] Initialized w:5 v:0 player:0 +[2023-09-14 11:22:17,909][98397] Initialized w:5 v:0 player:1 +[2023-09-14 11:22:17,910][98397] Initialized w:5 v:0 player:5 +[2023-09-14 11:22:17,911][98397] Initialized w:5 v:0 player:6 +[2023-09-14 11:22:17,915][98397] Initialized w:5 v:0 player:7 +[2023-09-14 11:22:17,926][98395] Using port 40501 on host... +[2023-09-14 11:22:17,928][98391] Initialized w:1 v:0 player:7 +[2023-09-14 11:22:17,929][98396] Initializing env for player 2, init_info: {'port': 40701}... +[2023-09-14 11:22:17,929][98391] Initialized w:1 v:0 player:0 +[2023-09-14 11:22:17,929][98391] Initialized w:1 v:0 player:5 +[2023-09-14 11:22:17,930][98391] Initialized w:1 v:0 player:6 +[2023-09-14 11:22:17,930][98391] Initialized w:1 v:0 player:3 +[2023-09-14 11:22:17,930][98391] Initialized w:1 v:0 player:4 +[2023-09-14 11:22:17,930][98391] Initialized w:1 v:0 player:2 +[2023-09-14 11:22:17,931][98391] Initialized w:1 v:0 player:1 +[2023-09-14 11:22:17,933][98391] 8 agent workers initialized for env 1! +[2023-09-14 11:22:17,947][98395] Initializing env for player 1, init_info: {'port': 40501}... +[2023-09-14 11:22:17,961][98394] Initializing env for player 4, init_info: {'port': 40601}... +[2023-09-14 11:22:17,971][98391] Decorrelating experience for 0 frames... +[2023-09-14 11:22:17,973][98391] Port 40401 is available +[2023-09-14 11:22:17,973][98391] Using port 40401 +[2023-09-14 11:22:17,979][98396] Initializing env for player 3, init_info: {'port': 40701}... +[2023-09-14 11:22:17,999][98395] Initializing env for player 2, init_info: {'port': 40501}... +[2023-09-14 11:22:18,027][98394] Initializing env for player 5, init_info: {'port': 40601}... +[2023-09-14 11:22:18,032][98396] Initializing env for player 4, init_info: {'port': 40701}... +[2023-09-14 11:22:18,048][98395] Initializing env for player 3, init_info: {'port': 40501}... +[2023-09-14 11:22:18,071][98394] Initializing env for player 6, init_info: {'port': 40601}... +[2023-09-14 11:22:18,086][98396] Initializing env for player 5, init_info: {'port': 40701}... +[2023-09-14 11:22:18,107][98395] Initializing env for player 4, init_info: {'port': 40501}... +[2023-09-14 11:22:18,123][98394] Initializing env for player 7, init_info: {'port': 40601}... +[2023-09-14 11:22:18,139][98396] Initializing env for player 6, init_info: {'port': 40701}... +[2023-09-14 11:22:18,175][98395] Initializing env for player 5, init_info: {'port': 40501}... +[2023-09-14 11:22:18,191][98396] Initializing env for player 7, init_info: {'port': 40701}... +[2023-09-14 11:22:18,246][98395] Initializing env for player 6, init_info: {'port': 40501}... +[2023-09-14 11:22:18,293][98395] Initializing env for player 7, init_info: {'port': 40501}... +[2023-09-14 11:22:18,866][98399] Initialized w:6 v:0 player:4 +[2023-09-14 11:22:18,867][98399] 8 agent workers initialized for env 6! +[2023-09-14 11:22:18,883][98391] Initializing env for player 0, init_info: {'port': 40401}... +[2023-09-14 11:22:18,918][98391] Using port 40401 on host... +[2023-09-14 11:22:18,934][98391] Initializing env for player 1, init_info: {'port': 40401}... +[2023-09-14 11:22:18,936][98399] Decorrelating experience for 0 frames... +[2023-09-14 11:22:18,937][98399] Port 40901 is available +[2023-09-14 11:22:18,937][98399] Using port 40901 +[2023-09-14 11:22:18,938][98399] Initializing env for player 0, init_info: {'port': 40901}... +[2023-09-14 11:22:18,966][98399] Using port 40901 on host... +[2023-09-14 11:22:18,984][98391] Initializing env for player 2, init_info: {'port': 40401}... +[2023-09-14 11:22:18,988][98399] Initializing env for player 1, init_info: {'port': 40901}... +[2023-09-14 11:22:19,036][98391] Initializing env for player 3, init_info: {'port': 40401}... +[2023-09-14 11:22:19,040][98399] Initializing env for player 2, init_info: {'port': 40901}... +[2023-09-14 11:22:19,092][98391] Initializing env for player 4, init_info: {'port': 40401}... +[2023-09-14 11:22:19,099][98399] Initializing env for player 3, init_info: {'port': 40901}... +[2023-09-14 11:22:19,147][98391] Initializing env for player 5, init_info: {'port': 40401}... +[2023-09-14 11:22:19,199][98391] Initializing env for player 6, init_info: {'port': 40401}... +[2023-09-14 11:22:19,155][98399] Initializing env for player 4, init_info: {'port': 40901}... +[2023-09-14 11:22:19,207][98399] Initializing env for player 5, init_info: {'port': 40901}... +[2023-09-14 11:22:19,259][98399] Initializing env for player 6, init_info: {'port': 40901}... +[2023-09-14 11:22:19,259][98391] Initializing env for player 7, init_info: {'port': 40401}... +[2023-09-14 11:22:19,311][98399] Initializing env for player 7, init_info: {'port': 40901}... +[2023-09-14 11:22:19,391][98394] Initialized w:3 v:1 player:0 +[2023-09-14 11:22:19,392][98394] Initialized w:3 v:1 player:4 +[2023-09-14 11:22:19,393][98394] Initialized w:3 v:1 player:5 +[2023-09-14 11:22:19,393][98394] Initialized w:3 v:1 player:3 +[2023-09-14 11:22:19,394][98394] Initialized w:3 v:1 player:1 +[2023-09-14 11:22:19,394][98394] Initialized w:3 v:1 player:2 +[2023-09-14 11:22:19,394][98394] Initialized w:3 v:1 player:6 +[2023-09-14 11:22:19,394][98394] Initialized w:3 v:1 player:7 +[2023-09-14 11:22:19,396][98394] 8 agent workers initialized for env 3! +[2023-09-14 11:22:19,432][98394] Decorrelating experience for 32 frames... +[2023-09-14 11:22:19,515][98396] Initialized w:4 v:1 player:6 +[2023-09-14 11:22:19,518][98396] Initialized w:4 v:1 player:7 +[2023-09-14 11:22:19,518][98396] Initialized w:4 v:1 player:3 +[2023-09-14 11:22:19,519][98396] Initialized w:4 v:1 player:1 +[2023-09-14 11:22:19,519][98396] Initialized w:4 v:1 player:4 +[2023-09-14 11:22:19,519][98396] Initialized w:4 v:1 player:5 +[2023-09-14 11:22:19,519][98396] Initialized w:4 v:1 player:0 +[2023-09-14 11:22:19,519][98396] Initialized w:4 v:1 player:2 +[2023-09-14 11:22:19,522][98396] 8 agent workers initialized for env 4! +[2023-09-14 11:22:19,559][98395] Initialized w:2 v:1 player:3 +[2023-09-14 11:22:19,561][98395] Initialized w:2 v:1 player:1 +[2023-09-14 11:22:19,562][98395] Initialized w:2 v:1 player:5 +[2023-09-14 11:22:19,562][98395] Initialized w:2 v:1 player:4 +[2023-09-14 11:22:19,562][98395] Initialized w:2 v:1 player:6 +[2023-09-14 11:22:19,563][98395] Initialized w:2 v:1 player:2 +[2023-09-14 11:22:19,563][98395] Initialized w:2 v:1 player:7 +[2023-09-14 11:22:19,563][98395] Initialized w:2 v:1 player:0 +[2023-09-14 11:22:19,566][98395] 8 agent workers initialized for env 2! +[2023-09-14 11:22:19,576][98396] Decorrelating experience for 32 frames... +[2023-09-14 11:22:19,616][98395] Decorrelating experience for 32 frames... +[2023-09-14 11:22:19,863][98394] Multi agent env, num agents: 8 +[2023-09-14 11:22:19,899][98395] Multi agent env, num agents: 8 +[2023-09-14 11:22:19,908][98394] Multi agent env, num agents: 8 +[2023-09-14 11:22:19,934][98395] Multi agent env, num agents: 8 +[2023-09-14 11:22:19,944][98394] Port 40602 is available +[2023-09-14 11:22:19,944][98394] Using port 40602 +[2023-09-14 11:22:19,945][98394] Initializing env for player 0, init_info: {'port': 40602}... +[2023-09-14 11:22:19,954][98396] Multi agent env, num agents: 8 +[2023-09-14 11:22:19,964][98395] Port 40502 is available +[2023-09-14 11:22:19,965][98395] Using port 40502 +[2023-09-14 11:22:19,965][98395] Initializing env for player 0, init_info: {'port': 40502}... +[2023-09-14 11:22:19,973][98394] Using port 40602 on host... +[2023-09-14 11:22:19,995][98394] Initializing env for player 1, init_info: {'port': 40602}... +[2023-09-14 11:22:20,000][98395] Using port 40502 on host... +[2023-09-14 11:22:20,001][98396] Multi agent env, num agents: 8 +[2023-09-14 11:22:20,016][98395] Initializing env for player 1, init_info: {'port': 40502}... +[2023-09-14 11:22:20,046][98394] Initializing env for player 2, init_info: {'port': 40602}... +[2023-09-14 11:22:20,048][98396] Port 40702 is available +[2023-09-14 11:22:20,048][98396] Using port 40702 +[2023-09-14 11:22:20,049][98396] Initializing env for player 0, init_info: {'port': 40702}... +[2023-09-14 11:22:20,066][98395] Initializing env for player 2, init_info: {'port': 40502}... +[2023-09-14 11:22:20,083][98396] Using port 40702 on host... +[2023-09-14 11:22:20,099][98394] Initializing env for player 3, init_info: {'port': 40602}... +[2023-09-14 11:22:20,100][98396] Initializing env for player 1, init_info: {'port': 40702}... +[2023-09-14 11:22:20,119][98395] Initializing env for player 3, init_info: {'port': 40502}... +[2023-09-14 11:22:20,150][98396] Initializing env for player 2, init_info: {'port': 40702}... +[2023-09-14 11:22:20,151][98394] Initializing env for player 4, init_info: {'port': 40602}... +[2023-09-14 11:22:20,168][98395] Initializing env for player 4, init_info: {'port': 40502}... +[2023-09-14 11:22:20,203][98396] Initializing env for player 3, init_info: {'port': 40702}... +[2023-09-14 11:22:20,216][98394] Initializing env for player 5, init_info: {'port': 40602}... +[2023-09-14 11:22:20,219][98395] Initializing env for player 5, init_info: {'port': 40502}... +[2023-09-14 11:22:20,255][98394] Initializing env for player 6, init_info: {'port': 40602}... +[2023-09-14 11:22:20,256][98396] Initializing env for player 4, init_info: {'port': 40702}... +[2023-09-14 11:22:20,271][98395] Initializing env for player 6, init_info: {'port': 40502}... +[2023-09-14 11:22:20,307][98394] Initializing env for player 7, init_info: {'port': 40602}... +[2023-09-14 11:22:20,309][98396] Initializing env for player 5, init_info: {'port': 40702}... +[2023-09-14 11:22:20,333][98395] Initializing env for player 7, init_info: {'port': 40502}... +[2023-09-14 11:22:20,359][98396] Initializing env for player 6, init_info: {'port': 40702}... +[2023-09-14 11:22:20,411][98396] Initializing env for player 7, init_info: {'port': 40702}... +[2023-09-14 11:22:20,578][98399] Initialized w:6 v:1 player:4 +[2023-09-14 11:22:20,580][98399] Initialized w:6 v:1 player:0 +[2023-09-14 11:22:20,580][98399] Initialized w:6 v:1 player:7 +[2023-09-14 11:22:20,582][98399] Initialized w:6 v:1 player:1 +[2023-09-14 11:22:20,582][98399] Initialized w:6 v:1 player:5 +[2023-09-14 11:22:20,582][98399] Initialized w:6 v:1 player:2 +[2023-09-14 11:22:20,582][98399] Initialized w:6 v:1 player:6 +[2023-09-14 11:22:20,583][98399] Initialized w:6 v:1 player:3 +[2023-09-14 11:22:20,585][98399] 8 agent workers initialized for env 6! +[2023-09-14 11:22:20,642][98399] Decorrelating experience for 32 frames... +[2023-09-14 11:22:20,687][98391] Initialized w:1 v:1 player:7 +[2023-09-14 11:22:20,689][98391] Initialized w:1 v:1 player:3 +[2023-09-14 11:22:20,690][98391] Initialized w:1 v:1 player:6 +[2023-09-14 11:22:20,691][98391] Initialized w:1 v:1 player:1 +[2023-09-14 11:22:20,692][98391] Initialized w:1 v:1 player:2 +[2023-09-14 11:22:20,693][98391] Initialized w:1 v:1 player:4 +[2023-09-14 11:22:20,694][98391] Initialized w:1 v:1 player:0 +[2023-09-14 11:22:20,695][98391] Initialized w:1 v:1 player:5 +[2023-09-14 11:22:20,695][98391] 8 agent workers initialized for env 1! +[2023-09-14 11:22:20,829][98391] Decorrelating experience for 32 frames... +[2023-09-14 11:22:20,982][98399] Multi agent env, num agents: 8 +[2023-09-14 11:22:21,018][98399] Multi agent env, num agents: 8 +[2023-09-14 11:22:21,048][98399] Port 40902 is available +[2023-09-14 11:22:21,048][98399] Using port 40902 +[2023-09-14 11:22:21,226][98391] Multi agent env, num agents: 8 +[2023-09-14 11:22:21,272][98391] Multi agent env, num agents: 8 +[2023-09-14 11:22:21,319][98391] Port 40402 is available +[2023-09-14 11:22:21,320][98391] Using port 40402 +[2023-09-14 11:22:21,320][98391] Initializing env for player 0, init_info: {'port': 40402}... +[2023-09-14 11:22:21,356][98391] Using port 40402 on host... +[2023-09-14 11:22:21,371][98391] Initializing env for player 1, init_info: {'port': 40402}... +[2023-09-14 11:22:21,430][98391] Initializing env for player 2, init_info: {'port': 40402}... +[2023-09-14 11:22:21,487][98391] Initializing env for player 3, init_info: {'port': 40402}... +[2023-09-14 11:22:21,547][98391] Initializing env for player 4, init_info: {'port': 40402}... +[2023-09-14 11:22:21,553][98394] Initialized w:3 v:2 player:1 +[2023-09-14 11:22:21,554][98394] Initialized w:3 v:2 player:4 +[2023-09-14 11:22:21,555][98394] Initialized w:3 v:2 player:3 +[2023-09-14 11:22:21,555][98394] Initialized w:3 v:2 player:7 +[2023-09-14 11:22:21,556][98394] Initialized w:3 v:2 player:5 +[2023-09-14 11:22:21,556][98394] Initialized w:3 v:2 player:0 +[2023-09-14 11:22:21,563][98394] Initialized w:3 v:2 player:2 +[2023-09-14 11:22:21,603][98391] Initializing env for player 5, init_info: {'port': 40402}... +[2023-09-14 11:22:21,646][98395] Initialized w:2 v:2 player:0 +[2023-09-14 11:22:21,647][98395] Initialized w:2 v:2 player:6 +[2023-09-14 11:22:21,648][98395] Initialized w:2 v:2 player:1 +[2023-09-14 11:22:21,648][98395] Initialized w:2 v:2 player:3 +[2023-09-14 11:22:21,648][98395] Initialized w:2 v:2 player:5 +[2023-09-14 11:22:21,649][98395] Initialized w:2 v:2 player:4 +[2023-09-14 11:22:21,649][98395] Initialized w:2 v:2 player:7 +[2023-09-14 11:22:21,649][98395] Initialized w:2 v:2 player:2 +[2023-09-14 11:22:21,651][98395] 8 agent workers initialized for env 2! +[2023-09-14 11:22:21,671][98391] Initializing env for player 6, init_info: {'port': 40402}... +[2023-09-14 11:22:21,691][98395] Decorrelating experience for 64 frames... +[2023-09-14 11:22:21,719][98391] Initializing env for player 7, init_info: {'port': 40402}... +[2023-09-14 11:22:21,723][98396] Initialized w:4 v:2 player:4 +[2023-09-14 11:22:21,724][98396] Initialized w:4 v:2 player:2 +[2023-09-14 11:22:21,724][98396] Initialized w:4 v:2 player:1 +[2023-09-14 11:22:21,724][98396] Initialized w:4 v:2 player:7 +[2023-09-14 11:22:21,724][98396] Initialized w:4 v:2 player:6 +[2023-09-14 11:22:21,725][98396] Initialized w:4 v:2 player:0 +[2023-09-14 11:22:21,725][98396] Initialized w:4 v:2 player:5 +[2023-09-14 11:22:21,725][98396] Initialized w:4 v:2 player:3 +[2023-09-14 11:22:21,727][98396] 8 agent workers initialized for env 4! +[2023-09-14 11:22:21,770][98396] Decorrelating experience for 64 frames... +[2023-09-14 11:22:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:22:22,221][98395] Port 40503 is available +[2023-09-14 11:22:22,222][98395] Using port 40503 +[2023-09-14 11:22:22,223][98395] Initializing env for player 0, init_info: {'port': 40503}... +[2023-09-14 11:22:22,253][98395] Using port 40503 on host... +[2023-09-14 11:22:22,273][98395] Initializing env for player 1, init_info: {'port': 40503}... +[2023-09-14 11:22:22,323][98396] Port 40703 is available +[2023-09-14 11:22:22,323][98396] Using port 40703 +[2023-09-14 11:22:22,323][98396] Initializing env for player 0, init_info: {'port': 40703}... +[2023-09-14 11:22:22,327][98395] Initializing env for player 2, init_info: {'port': 40503}... +[2023-09-14 11:22:22,353][98396] Using port 40703 on host... +[2023-09-14 11:22:22,374][98396] Initializing env for player 1, init_info: {'port': 40703}... +[2023-09-14 11:22:22,383][98395] Initializing env for player 3, init_info: {'port': 40503}... +[2023-09-14 11:22:22,429][98396] Initializing env for player 2, init_info: {'port': 40703}... +[2023-09-14 11:22:22,439][98395] Initializing env for player 4, init_info: {'port': 40503}... +[2023-09-14 11:22:22,479][98396] Initializing env for player 3, init_info: {'port': 40703}... +[2023-09-14 11:22:22,495][98395] Initializing env for player 5, init_info: {'port': 40503}... +[2023-09-14 11:22:22,543][98395] Initializing env for player 6, init_info: {'port': 40503}... +[2023-09-14 11:22:22,544][98396] Initializing env for player 4, init_info: {'port': 40703}... +[2023-09-14 11:22:22,552][98394] Initialized w:3 v:2 player:6 +[2023-09-14 11:22:22,554][98394] 8 agent workers initialized for env 3! +[2023-09-14 11:22:22,575][98399] Initializing env for player 0, init_info: {'port': 40902}... +[2023-09-14 11:22:22,595][98396] Initializing env for player 5, init_info: {'port': 40703}... +[2023-09-14 11:22:22,599][98395] Initializing env for player 7, init_info: {'port': 40503}... +[2023-09-14 11:22:22,620][98399] Using port 40902 on host... +[2023-09-14 11:22:22,631][98399] Initializing env for player 1, init_info: {'port': 40902}... +[2023-09-14 11:22:22,640][98394] Decorrelating experience for 64 frames... +[2023-09-14 11:22:22,649][98396] Initializing env for player 6, init_info: {'port': 40703}... +[2023-09-14 11:22:22,686][98399] Initializing env for player 2, init_info: {'port': 40902}... +[2023-09-14 11:22:22,715][98396] Initializing env for player 7, init_info: {'port': 40703}... +[2023-09-14 11:22:22,751][98399] Initializing env for player 3, init_info: {'port': 40902}... +[2023-09-14 11:22:22,795][98399] Initializing env for player 4, init_info: {'port': 40902}... +[2023-09-14 11:22:22,855][98399] Initializing env for player 5, init_info: {'port': 40902}... +[2023-09-14 11:22:22,919][98399] Initializing env for player 6, init_info: {'port': 40902}... +[2023-09-14 11:22:22,983][98399] Initializing env for player 7, init_info: {'port': 40902}... +[2023-09-14 11:22:23,107][98391] Initialized w:1 v:2 player:7 +[2023-09-14 11:22:23,108][98391] Initialized w:1 v:2 player:6 +[2023-09-14 11:22:23,108][98391] Initialized w:1 v:2 player:2 +[2023-09-14 11:22:23,108][98391] Initialized w:1 v:2 player:0 +[2023-09-14 11:22:23,108][98391] Initialized w:1 v:2 player:5 +[2023-09-14 11:22:23,108][98391] Initialized w:1 v:2 player:1 +[2023-09-14 11:22:23,108][98391] Initialized w:1 v:2 player:3 +[2023-09-14 11:22:23,108][98391] Initialized w:1 v:2 player:4 +[2023-09-14 11:22:23,111][98391] 8 agent workers initialized for env 1! +[2023-09-14 11:22:23,144][98391] Decorrelating experience for 64 frames... +[2023-09-14 11:22:23,163][98394] Port 40603 is available +[2023-09-14 11:22:23,163][98394] Using port 40603 +[2023-09-14 11:22:23,164][98394] Initializing env for player 0, init_info: {'port': 40603}... +[2023-09-14 11:22:23,193][98394] Using port 40603 on host... +[2023-09-14 11:22:23,214][98394] Initializing env for player 1, init_info: {'port': 40603}... +[2023-09-14 11:22:23,275][98394] Initializing env for player 2, init_info: {'port': 40603}... +[2023-09-14 11:22:23,327][98394] Initializing env for player 3, init_info: {'port': 40603}... +[2023-09-14 11:22:23,383][98394] Initializing env for player 4, init_info: {'port': 40603}... +[2023-09-14 11:22:23,434][98394] Initializing env for player 5, init_info: {'port': 40603}... +[2023-09-14 11:22:23,491][98394] Initializing env for player 6, init_info: {'port': 40603}... +[2023-09-14 11:22:23,547][98394] Initializing env for player 7, init_info: {'port': 40603}... +[2023-09-14 11:22:23,666][98391] Port 40403 is available +[2023-09-14 11:22:23,666][98391] Using port 40403 +[2023-09-14 11:22:23,667][98391] Initializing env for player 0, init_info: {'port': 40403}... +[2023-09-14 11:22:23,695][98391] Using port 40403 on host... +[2023-09-14 11:22:23,717][98391] Initializing env for player 1, init_info: {'port': 40403}... +[2023-09-14 11:22:23,768][98391] Initializing env for player 2, init_info: {'port': 40403}... +[2023-09-14 11:22:23,829][98391] Initializing env for player 3, init_info: {'port': 40403}... +[2023-09-14 11:22:23,887][98391] Initializing env for player 4, init_info: {'port': 40403}... +[2023-09-14 11:22:23,939][98391] Initializing env for player 5, init_info: {'port': 40403}... +[2023-09-14 11:22:23,972][98396] Initialized w:4 v:3 player:7 +[2023-09-14 11:22:23,972][98396] Initialized w:4 v:3 player:3 +[2023-09-14 11:22:23,973][98396] Initialized w:4 v:3 player:1 +[2023-09-14 11:22:23,973][98396] Initialized w:4 v:3 player:6 +[2023-09-14 11:22:23,973][98396] Initialized w:4 v:3 player:2 +[2023-09-14 11:22:23,973][98396] Initialized w:4 v:3 player:4 +[2023-09-14 11:22:23,973][98396] Initialized w:4 v:3 player:5 +[2023-09-14 11:22:23,974][98396] Initialized w:4 v:3 player:0 +[2023-09-14 11:22:23,976][98396] 8 agent workers initialized for env 4! +[2023-09-14 11:22:23,987][98391] Initializing env for player 6, init_info: {'port': 40403}... +[2023-09-14 11:22:24,016][98396] Decorrelating experience for 96 frames... +[2023-09-14 11:22:24,051][98391] Initializing env for player 7, init_info: {'port': 40403}... +[2023-09-14 11:22:24,062][98395] Initialized w:2 v:3 player:7 +[2023-09-14 11:22:24,062][98395] Initialized w:2 v:3 player:3 +[2023-09-14 11:22:24,063][98395] Initialized w:2 v:3 player:0 +[2023-09-14 11:22:24,063][98395] Initialized w:2 v:3 player:5 +[2023-09-14 11:22:24,063][98395] Initialized w:2 v:3 player:2 +[2023-09-14 11:22:24,064][98395] Initialized w:2 v:3 player:1 +[2023-09-14 11:22:24,064][98395] Initialized w:2 v:3 player:6 +[2023-09-14 11:22:24,064][98395] Initialized w:2 v:3 player:4 +[2023-09-14 11:22:24,066][98395] 8 agent workers initialized for env 2! +[2023-09-14 11:22:24,117][98395] Decorrelating experience for 96 frames... +[2023-09-14 11:22:24,211][98399] Initialized w:6 v:2 player:7 +[2023-09-14 11:22:24,211][98399] Initialized w:6 v:2 player:0 +[2023-09-14 11:22:24,212][98399] Initialized w:6 v:2 player:1 +[2023-09-14 11:22:24,212][98399] Initialized w:6 v:2 player:4 +[2023-09-14 11:22:24,212][98399] Initialized w:6 v:2 player:6 +[2023-09-14 11:22:24,212][98399] Initialized w:6 v:2 player:2 +[2023-09-14 11:22:24,212][98399] Initialized w:6 v:2 player:5 +[2023-09-14 11:22:24,213][98399] Initialized w:6 v:2 player:3 +[2023-09-14 11:22:24,215][98399] 8 agent workers initialized for env 6! +[2023-09-14 11:22:24,264][98399] Decorrelating experience for 64 frames... +[2023-09-14 11:22:24,810][98394] Initialized w:3 v:3 player:5 +[2023-09-14 11:22:24,813][98394] Initialized w:3 v:3 player:2 +[2023-09-14 11:22:24,813][98394] Initialized w:3 v:3 player:3 +[2023-09-14 11:22:24,813][98394] Initialized w:3 v:3 player:4 +[2023-09-14 11:22:24,813][98394] Initialized w:3 v:3 player:0 +[2023-09-14 11:22:24,813][98394] Initialized w:3 v:3 player:1 +[2023-09-14 11:22:24,813][98394] Initialized w:3 v:3 player:7 +[2023-09-14 11:22:24,813][98394] Initialized w:3 v:3 player:6 +[2023-09-14 11:22:24,817][98394] 8 agent workers initialized for env 3! +[2023-09-14 11:22:24,876][98394] Decorrelating experience for 96 frames... +[2023-09-14 11:22:24,961][98399] Port 40903 is available +[2023-09-14 11:22:24,961][98399] Using port 40903 +[2023-09-14 11:22:24,962][98399] Initializing env for player 0, init_info: {'port': 40903}... +[2023-09-14 11:22:25,000][98399] Using port 40903 on host... +[2023-09-14 11:22:25,014][98399] Initializing env for player 1, init_info: {'port': 40903}... +[2023-09-14 11:22:25,064][98399] Initializing env for player 2, init_info: {'port': 40903}... +[2023-09-14 11:22:25,115][98399] Initializing env for player 3, init_info: {'port': 40903}... +[2023-09-14 11:22:25,171][98399] Initializing env for player 4, init_info: {'port': 40903}... +[2023-09-14 11:22:25,239][98399] Initializing env for player 5, init_info: {'port': 40903}... +[2023-09-14 11:22:25,287][98399] Initializing env for player 6, init_info: {'port': 40903}... +[2023-09-14 11:22:25,347][98399] Initializing env for player 7, init_info: {'port': 40903}... +[2023-09-14 11:22:25,367][98391] Initialized w:1 v:3 player:7 +[2023-09-14 11:22:25,369][98391] Initialized w:1 v:3 player:2 +[2023-09-14 11:22:25,369][98391] Initialized w:1 v:3 player:0 +[2023-09-14 11:22:25,370][98391] Initialized w:1 v:3 player:3 +[2023-09-14 11:22:25,370][98391] Initialized w:1 v:3 player:5 +[2023-09-14 11:22:25,370][98391] Initialized w:1 v:3 player:6 +[2023-09-14 11:22:25,370][98391] Initialized w:1 v:3 player:1 +[2023-09-14 11:22:25,371][98391] Initialized w:1 v:3 player:4 +[2023-09-14 11:22:25,373][98391] 8 agent workers initialized for env 1! +[2023-09-14 11:22:25,426][98391] Decorrelating experience for 96 frames... +[2023-09-14 11:22:25,980][98398] Port 41000 is available +[2023-09-14 11:22:25,980][98398] Using port 41000 +[2023-09-14 11:22:25,981][98398] Initializing env for player 0, init_info: {'port': 41000}... +[2023-09-14 11:22:26,019][98398] Using port 41000 on host... +[2023-09-14 11:22:26,031][98398] Initializing env for player 1, init_info: {'port': 41000}... +[2023-09-14 11:22:26,082][98398] Initializing env for player 2, init_info: {'port': 41000}... +[2023-09-14 11:22:26,132][98398] Initializing env for player 3, init_info: {'port': 41000}... +[2023-09-14 11:22:26,195][98398] Initializing env for player 4, init_info: {'port': 41000}... +[2023-09-14 11:22:26,246][98398] Initializing env for player 5, init_info: {'port': 41000}... +[2023-09-14 11:22:26,307][98398] Initializing env for player 6, init_info: {'port': 41000}... +[2023-09-14 11:22:26,363][98398] Initializing env for player 7, init_info: {'port': 41000}... +[2023-09-14 11:22:26,521][98399] Initialized w:6 v:3 player:3 +[2023-09-14 11:22:26,522][98399] Initialized w:6 v:3 player:0 +[2023-09-14 11:22:26,523][98399] Initialized w:6 v:3 player:4 +[2023-09-14 11:22:26,524][98399] Initialized w:6 v:3 player:2 +[2023-09-14 11:22:26,524][98399] Initialized w:6 v:3 player:6 +[2023-09-14 11:22:26,524][98399] Initialized w:6 v:3 player:7 +[2023-09-14 11:22:26,524][98399] Initialized w:6 v:3 player:5 +[2023-09-14 11:22:26,524][98399] Initialized w:6 v:3 player:1 +[2023-09-14 11:22:26,526][98399] 8 agent workers initialized for env 6! +[2023-09-14 11:22:26,567][98399] Decorrelating experience for 96 frames... +[2023-09-14 11:22:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:22:27,200][98257] Signal inference workers to stop experience collection... +[2023-09-14 11:22:27,213][98392] InferenceWorker_p0-w0: stopping experience collection +[2023-09-14 11:22:27,637][98398] Initialized w:7 v:0 player:7 +[2023-09-14 11:22:27,638][98398] Initialized w:7 v:0 player:1 +[2023-09-14 11:22:27,638][98398] Initialized w:7 v:0 player:2 +[2023-09-14 11:22:27,639][98398] Initialized w:7 v:0 player:3 +[2023-09-14 11:22:27,640][98398] Initialized w:7 v:0 player:6 +[2023-09-14 11:22:27,640][98398] Initialized w:7 v:0 player:4 +[2023-09-14 11:22:27,640][98398] Initialized w:7 v:0 player:0 +[2023-09-14 11:22:27,641][98398] Initialized w:7 v:0 player:5 +[2023-09-14 11:22:27,642][98398] 8 agent workers initialized for env 7! +[2023-09-14 11:22:27,676][98398] Decorrelating experience for 0 frames... +[2023-09-14 11:22:27,677][98398] Port 41001 is available +[2023-09-14 11:22:27,677][98398] Using port 41001 +[2023-09-14 11:22:27,678][98398] Initializing env for player 0, init_info: {'port': 41001}... +[2023-09-14 11:22:27,706][98398] Using port 41001 on host... +[2023-09-14 11:22:27,728][98398] Initializing env for player 1, init_info: {'port': 41001}... +[2023-09-14 11:22:27,779][98398] Initializing env for player 2, init_info: {'port': 41001}... +[2023-09-14 11:22:27,831][98398] Initializing env for player 3, init_info: {'port': 41001}... +[2023-09-14 11:22:27,887][98398] Initializing env for player 4, init_info: {'port': 41001}... +[2023-09-14 11:22:27,947][98398] Initializing env for player 5, init_info: {'port': 41001}... +[2023-09-14 11:22:27,999][98398] Initializing env for player 6, init_info: {'port': 41001}... +[2023-09-14 11:22:28,047][98398] Initializing env for player 7, init_info: {'port': 41001}... +[2023-09-14 11:22:28,301][98257] EvtLoop [learner_proc0_evt_loop, process=learner_proc0] unhandled exception in slot='on_new_training_batch' connected to emitter=Emitter(object_id='Batcher_0', signal_name='training_batches_available'), args=(0,) +Traceback (most recent call last): + File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py", line 355, in _process_signal + slot_callable(*args) + File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner_worker.py", line 150, in on_new_training_batch + stats = self.learner.train(self.batcher.training_batches[batch_idx]) + File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 1046, in train + train_stats = self._train(buff, self.cfg.batch_size, experience_size, num_invalids) + File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 731, in _train + ) = self._calculate_losses(mb, num_invalids) + File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 649, in _calculate_losses + exploration_loss = self.exploration_loss_func(action_distribution, valids, num_invalids) + File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 477, in _symmetric_kl_exploration_loss + kl_prior = action_distribution.symmetric_kl_with_uniform_prior() + File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py", line 247, in symmetric_kl_with_uniform_prior + sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions] + File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py", line 247, in + sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions] +AttributeError: 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior' +[2023-09-14 11:22:28,302][98257] Unhandled exception 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior' in evt loop learner_proc0_evt_loop +[2023-09-14 11:22:29,282][98398] Initialized w:7 v:1 player:2 +[2023-09-14 11:22:29,284][98398] Initialized w:7 v:1 player:3 +[2023-09-14 11:22:29,284][98398] Initialized w:7 v:1 player:6 +[2023-09-14 11:22:29,284][98398] Initialized w:7 v:1 player:7 +[2023-09-14 11:22:29,285][98398] Initialized w:7 v:1 player:4 +[2023-09-14 11:22:29,285][98398] Initialized w:7 v:1 player:1 +[2023-09-14 11:22:29,285][98398] Initialized w:7 v:1 player:0 +[2023-09-14 11:22:29,285][98398] Initialized w:7 v:1 player:5 +[2023-09-14 11:22:29,287][98398] 8 agent workers initialized for env 7! +[2023-09-14 11:22:29,327][98398] Decorrelating experience for 32 frames... +[2023-09-14 11:22:29,587][98398] Multi agent env, num agents: 8 +[2023-09-14 11:22:29,616][98398] Multi agent env, num agents: 8 +[2023-09-14 11:22:29,645][98398] Port 41002 is available +[2023-09-14 11:22:29,645][98398] Using port 41002 +[2023-09-14 11:22:29,646][98398] Initializing env for player 0, init_info: {'port': 41002}... +[2023-09-14 11:22:29,679][98398] Using port 41002 on host... +[2023-09-14 11:22:29,696][98398] Initializing env for player 1, init_info: {'port': 41002}... +[2023-09-14 11:22:29,747][98398] Initializing env for player 2, init_info: {'port': 41002}... +[2023-09-14 11:22:29,797][98398] Initializing env for player 3, init_info: {'port': 41002}... +[2023-09-14 11:22:29,867][98398] Initializing env for player 4, init_info: {'port': 41002}... +[2023-09-14 11:22:29,927][98398] Initializing env for player 5, init_info: {'port': 41002}... +[2023-09-14 11:22:29,985][98398] Initializing env for player 6, init_info: {'port': 41002}... +[2023-09-14 11:22:30,027][98398] Initializing env for player 7, init_info: {'port': 41002}... +[2023-09-14 11:22:31,101][97397] Heartbeat connected on Batcher_0 +[2023-09-14 11:22:31,107][97397] Heartbeat connected on InferenceWorker_p0-w0 +[2023-09-14 11:22:31,115][97397] Heartbeat connected on RolloutWorker_w1 +[2023-09-14 11:22:31,118][97397] Heartbeat connected on RolloutWorker_w2 +[2023-09-14 11:22:31,121][97397] Heartbeat connected on RolloutWorker_w3 +[2023-09-14 11:22:31,124][97397] Heartbeat connected on RolloutWorker_w4 +[2023-09-14 11:22:31,130][97397] Heartbeat connected on RolloutWorker_w6 +[2023-09-14 11:22:31,151][98398] Initialized w:7 v:2 player:1 +[2023-09-14 11:22:31,151][98398] Initialized w:7 v:2 player:4 +[2023-09-14 11:22:31,152][98398] Initialized w:7 v:2 player:5 +[2023-09-14 11:22:31,152][98398] Initialized w:7 v:2 player:6 +[2023-09-14 11:22:31,153][98398] Initialized w:7 v:2 player:0 +[2023-09-14 11:22:31,153][98398] Initialized w:7 v:2 player:7 +[2023-09-14 11:22:31,153][98398] Initialized w:7 v:2 player:3 +[2023-09-14 11:22:31,154][98398] Initialized w:7 v:2 player:2 +[2023-09-14 11:22:31,156][98398] 8 agent workers initialized for env 7! +[2023-09-14 11:22:31,212][98398] Decorrelating experience for 64 frames... +[2023-09-14 11:22:31,689][98398] Port 41003 is available +[2023-09-14 11:22:31,689][98398] Using port 41003 +[2023-09-14 11:22:31,690][98398] Initializing env for player 0, init_info: {'port': 41003}... +[2023-09-14 11:22:31,718][98398] Using port 41003 on host... +[2023-09-14 11:22:31,740][98398] Initializing env for player 1, init_info: {'port': 41003}... +[2023-09-14 11:22:31,798][98398] Initializing env for player 2, init_info: {'port': 41003}... +[2023-09-14 11:22:31,848][98398] Initializing env for player 3, init_info: {'port': 41003}... +[2023-09-14 11:22:31,907][98398] Initializing env for player 4, init_info: {'port': 41003}... +[2023-09-14 11:22:31,955][98398] Initializing env for player 5, init_info: {'port': 41003}... +[2023-09-14 11:22:32,008][98398] Initializing env for player 6, init_info: {'port': 41003}... +[2023-09-14 11:22:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 251.7. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:22:32,055][98398] Initializing env for player 7, init_info: {'port': 41003}... +[2023-09-14 11:22:33,297][98398] Initialized w:7 v:3 player:1 +[2023-09-14 11:22:33,300][98398] Initialized w:7 v:3 player:3 +[2023-09-14 11:22:33,300][98398] Initialized w:7 v:3 player:4 +[2023-09-14 11:22:33,300][98398] Initialized w:7 v:3 player:6 +[2023-09-14 11:22:33,300][98398] Initialized w:7 v:3 player:2 +[2023-09-14 11:22:33,300][98398] Initialized w:7 v:3 player:7 +[2023-09-14 11:22:33,300][98398] Initialized w:7 v:3 player:5 +[2023-09-14 11:22:33,301][98398] Initialized w:7 v:3 player:0 +[2023-09-14 11:22:33,303][98398] 8 agent workers initialized for env 7! +[2023-09-14 11:22:33,345][98398] Decorrelating experience for 96 frames... +[2023-09-14 11:22:33,999][97397] Heartbeat connected on RolloutWorker_w7 +[2023-09-14 11:22:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 188.8. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:22:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 151.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:22:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 125.9. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:22:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 107.9. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:22:57,032][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 94.4. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:23:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 83.9. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:23:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 83.9. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:23:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 83.9. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:23:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:23:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:23:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:23:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:23:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:23:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:23:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:23:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:23:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:24:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:24:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:24:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:24:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:24:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:24:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:24:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:24:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:24:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:24:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:24:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:24:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:25:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:25:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:25:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:25:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:25:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:25:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:25:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:25:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:25:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:25:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:25:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:25:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:26:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:26:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:26:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:26:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:26:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:26:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:26:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:26:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:26:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:26:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:26:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:26:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:27:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:27:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:27:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:27:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:27:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:27:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:27:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:27:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:27:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:27:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:27:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:27:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:28:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:28:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:28:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:28:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:28:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:28:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:28:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:28:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:28:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:28:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:28:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:28:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:29:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:29:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:29:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:29:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:29:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:29:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:29:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:29:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:29:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:29:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:29:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:29:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:30:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:30:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:30:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:30:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:30:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:30:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:30:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:30:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:30:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:30:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:30:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:30:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:31:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:31:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:31:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:31:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:31:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:31:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:31:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:31:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:31:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:31:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:31:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:31:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:32:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:32:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:32:07,036][97397] Components not started: LearnerWorker_p0, RolloutWorker_w0, RolloutWorker_w5, wait_time=600.0 seconds +[2023-09-14 11:32:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:32:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:32:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:32:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:32:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:32:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:32:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:32:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:32:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:32:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:33:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:33:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:33:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:33:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:33:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:33:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:33:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:33:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:33:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:33:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:33:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:33:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:34:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:34:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:34:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:34:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:34:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:34:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:34:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:34:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:34:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:34:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:34:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:34:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:35:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:35:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:35:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:35:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:35:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:35:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:35:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:35:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:35:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:35:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:35:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:35:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:36:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:36:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:36:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:36:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:36:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:36:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:36:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:36:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:36:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:36:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:36:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:36:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:37:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:37:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:37:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:37:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:37:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:37:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:37:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:37:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:37:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:37:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:37:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:37:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:38:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:38:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:38:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:38:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:38:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:38:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:38:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:38:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:38:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:38:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:38:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:38:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:39:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:39:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:39:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:39:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:39:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:39:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:39:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:39:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:39:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:39:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:39:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:39:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:40:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:40:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:40:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:40:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:40:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:40:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:40:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:40:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:40:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:40:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:40:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:40:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:41:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:41:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:41:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:41:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:41:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:41:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:41:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:41:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:41:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:41:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:41:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:41:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:42:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:42:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:42:07,035][97397] Components not started: LearnerWorker_p0, RolloutWorker_w0, RolloutWorker_w5, wait_time=1200.0 seconds +[2023-09-14 11:42:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:42:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:42:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:42:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:42:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:42:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:42:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:42:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:42:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:42:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:43:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:43:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:43:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:43:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:43:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:43:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:43:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:43:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:43:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:43:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:43:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:43:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:44:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:44:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:44:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:44:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:44:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:44:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:44:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:44:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:44:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:44:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:44:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:44:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:45:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:45:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:45:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:45:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:45:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:45:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:45:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:45:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:45:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:45:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:45:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:45:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:46:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:46:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:46:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:46:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:46:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:46:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:46:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:46:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:46:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:46:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:46:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:46:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:47:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:47:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:47:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:47:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:47:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:47:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:47:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:47:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:47:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:47:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:47:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:47:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:48:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:48:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:48:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:48:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:48:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:48:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:48:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:48:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:48:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:48:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:48:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:48:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:49:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:49:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:49:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:49:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:49:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:49:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:49:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:49:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:49:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:49:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:49:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:49:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:50:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:50:07,032][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:50:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:50:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:50:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:50:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:50:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:50:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:50:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:50:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:50:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:50:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:51:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:51:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:51:12,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:51:17,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:51:22,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:51:27,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:51:32,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:51:37,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:51:42,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:51:47,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:51:52,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:51:57,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:52:02,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:52:07,031][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3776. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:52:07,034][97397] Components not started: LearnerWorker_p0, RolloutWorker_w0, RolloutWorker_w5, wait_time=1800.0 seconds +[2023-09-14 11:52:07,036][97397] Components take too long to start: LearnerWorker_p0, RolloutWorker_w0, RolloutWorker_w5. Aborting the experiment! + + + +[2023-09-14 11:52:07,039][98257] Stopping Batcher_0... +[2023-09-14 11:52:07,040][98257] Loop batcher_evt_loop terminating... +[2023-09-14 11:52:07,039][97397] Component Batcher_0 stopped! +[2023-09-14 11:52:07,041][97397] Waiting for ['LearnerWorker_p0', 'InferenceWorker_p0-w0', 'RolloutWorker_w0', 'RolloutWorker_w1', 'RolloutWorker_w2', 'RolloutWorker_w3', 'RolloutWorker_w4', 'RolloutWorker_w5', 'RolloutWorker_w6', 'RolloutWorker_w7'] to stop... +[2023-09-14 11:52:07,055][98392] Weights refcount: 2 0 +[2023-09-14 11:52:07,057][98392] Stopping InferenceWorker_p0-w0... +[2023-09-14 11:52:07,057][98392] Loop inference_proc0-0_evt_loop terminating... +[2023-09-14 11:52:07,057][97397] Component InferenceWorker_p0-w0 stopped! +[2023-09-14 11:52:07,058][97397] Waiting for ['LearnerWorker_p0', 'RolloutWorker_w0', 'RolloutWorker_w1', 'RolloutWorker_w2', 'RolloutWorker_w3', 'RolloutWorker_w4', 'RolloutWorker_w5', 'RolloutWorker_w6', 'RolloutWorker_w7'] to stop... +[2023-09-14 11:52:10,256][98391] Stopping RolloutWorker_w1... +[2023-09-14 11:52:10,256][98391] Loop rollout_proc1_evt_loop terminating... +[2023-09-14 11:52:10,257][98396] Stopping RolloutWorker_w4... +[2023-09-14 11:52:10,257][98394] Stopping RolloutWorker_w3... +[2023-09-14 11:52:10,257][98396] Loop rollout_proc4_evt_loop terminating... +[2023-09-14 11:52:10,258][98394] Loop rollout_proc3_evt_loop terminating... +[2023-09-14 11:52:10,258][98398] Stopping RolloutWorker_w7... +[2023-09-14 11:52:10,257][97397] Component LearnerWorker_p0 process died already! Don't wait for it. +[2023-09-14 11:52:10,258][98398] Loop rollout_proc7_evt_loop terminating... +[2023-09-14 11:52:10,259][98399] Stopping RolloutWorker_w6... +[2023-09-14 11:52:10,258][97397] Component RolloutWorker_w1 stopped! +[2023-09-14 11:52:10,260][98399] Loop rollout_proc6_evt_loop terminating... +[2023-09-14 11:52:10,261][98395] Stopping RolloutWorker_w2... +[2023-09-14 11:52:10,261][97397] Waiting for ['RolloutWorker_w0', 'RolloutWorker_w2', 'RolloutWorker_w3', 'RolloutWorker_w4', 'RolloutWorker_w5', 'RolloutWorker_w6', 'RolloutWorker_w7'] to stop... +[2023-09-14 11:52:10,262][98395] Loop rollout_proc2_evt_loop terminating... +[2023-09-14 11:52:10,262][97397] Component RolloutWorker_w4 stopped! +[2023-09-14 11:52:10,264][97397] Waiting for ['RolloutWorker_w0', 'RolloutWorker_w2', 'RolloutWorker_w3', 'RolloutWorker_w5', 'RolloutWorker_w6', 'RolloutWorker_w7'] to stop... +[2023-09-14 11:52:10,265][97397] Component RolloutWorker_w3 stopped! +[2023-09-14 11:52:10,266][97397] Waiting for ['RolloutWorker_w0', 'RolloutWorker_w2', 'RolloutWorker_w5', 'RolloutWorker_w6', 'RolloutWorker_w7'] to stop... +[2023-09-14 11:52:10,267][97397] Component RolloutWorker_w7 stopped! +[2023-09-14 11:52:10,268][97397] Waiting for ['RolloutWorker_w0', 'RolloutWorker_w2', 'RolloutWorker_w5', 'RolloutWorker_w6'] to stop... +[2023-09-14 11:52:10,269][97397] Component RolloutWorker_w6 stopped! +[2023-09-14 11:52:10,270][97397] Waiting for ['RolloutWorker_w0', 'RolloutWorker_w2', 'RolloutWorker_w5'] to stop... +[2023-09-14 11:52:10,271][97397] Component RolloutWorker_w2 stopped! +[2023-09-14 11:52:10,272][97397] Waiting for ['RolloutWorker_w0', 'RolloutWorker_w5'] to stop... +[2023-09-14 11:58:18,082][97397] Keyboard interrupt detected in the event loop EvtLoop [Runner_EvtLoop, process=main process 97397], exiting... +[2023-09-14 11:58:18,084][97397] Runner profile tree view: +main_loop: 2166.9503 +[2023-09-14 11:58:18,086][97397] Collected {0: 0}, FPS: 0.0 +[2023-09-14 11:59:16,308][97397] Environment doom_basic already registered, overwriting... +[2023-09-14 11:59:16,310][97397] Environment doom_two_colors_easy already registered, overwriting... +[2023-09-14 11:59:16,313][97397] Environment doom_two_colors_hard already registered, overwriting... +[2023-09-14 11:59:16,315][97397] Environment doom_dm already registered, overwriting... +[2023-09-14 11:59:16,316][97397] Environment doom_dwango5 already registered, overwriting... +[2023-09-14 11:59:16,317][97397] Environment doom_my_way_home_flat_actions already registered, overwriting... +[2023-09-14 11:59:16,318][97397] Environment doom_defend_the_center_flat_actions already registered, overwriting... +[2023-09-14 11:59:16,319][97397] Environment doom_my_way_home already registered, overwriting... +[2023-09-14 11:59:16,319][97397] Environment doom_deadly_corridor already registered, overwriting... +[2023-09-14 11:59:16,320][97397] Environment doom_defend_the_center already registered, overwriting... +[2023-09-14 11:59:16,321][97397] Environment doom_defend_the_line already registered, overwriting... +[2023-09-14 11:59:16,322][97397] Environment doom_health_gathering already registered, overwriting... +[2023-09-14 11:59:16,323][97397] Environment doom_health_gathering_supreme already registered, overwriting... +[2023-09-14 11:59:16,324][97397] Environment doom_battle already registered, overwriting... +[2023-09-14 11:59:16,325][97397] Environment doom_battle2 already registered, overwriting... +[2023-09-14 11:59:16,325][97397] Environment doom_duel_bots already registered, overwriting... +[2023-09-14 11:59:16,326][97397] Environment doom_deathmatch_bots already registered, overwriting... +[2023-09-14 11:59:16,327][97397] Environment doom_duel already registered, overwriting... +[2023-09-14 11:59:16,328][97397] Environment doom_deathmatch_full already registered, overwriting... +[2023-09-14 11:59:16,329][97397] Environment doom_benchmark already registered, overwriting... +[2023-09-14 11:59:16,329][97397] register_encoder_factory: +[2023-09-14 11:59:16,355][97397] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json +[2023-09-14 11:59:16,356][97397] Overriding arg 'env' with value 'doom_dm' passed from command line +[2023-09-14 11:59:16,360][97397] Experiment dir /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment already exists! +[2023-09-14 11:59:16,361][97397] Resuming existing experiment from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment... +[2023-09-14 11:59:16,361][97397] Weights and Biases integration disabled +[2023-09-14 11:59:16,363][97397] Environment var CUDA_VISIBLE_DEVICES is 0,1 + +[2023-09-14 11:59:18,348][97397] Starting experiment with the following configuration: +help=False +algo=APPO +env=doom_dm +experiment=default_experiment +train_dir=/home/cogstack/Documents/optuna/environments/sample_factory/train_dir +restart_behavior=resume +device=gpu +seed=None +num_policies=1 +async_rl=True +serial_mode=False +batched_sampling=False +num_batches_to_accumulate=2 +worker_num_splits=2 +policy_workers_per_policy=1 +max_policy_lag=1000 +num_workers=8 +num_envs_per_worker=4 +batch_size=1024 +num_batches_per_epoch=1 +num_epochs=1 +rollout=32 +recurrence=32 +shuffle_minibatches=False +gamma=0.99 +reward_scale=1.0 +reward_clip=1000.0 +value_bootstrap=False +normalize_returns=True +exploration_loss_coeff=0.001 +value_loss_coeff=0.5 +kl_loss_coeff=0.0 +exploration_loss=symmetric_kl +gae_lambda=0.95 +ppo_clip_ratio=0.1 +ppo_clip_value=0.2 +with_vtrace=False +vtrace_rho=1.0 +vtrace_c=1.0 +optimizer=adam +adam_eps=1e-06 +adam_beta1=0.9 +adam_beta2=0.999 +max_grad_norm=4.0 +learning_rate=0.0001 +lr_schedule=constant +lr_schedule_kl_threshold=0.008 +lr_adaptive_min=1e-06 +lr_adaptive_max=0.01 +obs_subtract_mean=0.0 +obs_scale=255.0 +normalize_input=True +normalize_input_keys=None +decorrelate_experience_max_seconds=0 +decorrelate_envs_on_one_worker=True +actor_worker_gpus=[] +set_workers_cpu_affinity=True +force_envs_single_thread=False +default_niceness=0 +log_to_file=True +experiment_summaries_interval=10 +flush_summaries_interval=30 +stats_avg=100 +summaries_use_frameskip=True +heartbeat_interval=20 +heartbeat_reporting_interval=600 +train_for_env_steps=1000000 +train_for_seconds=10000000000 +save_every_sec=120 +keep_checkpoints=2 +load_checkpoint_kind=latest +save_milestones_sec=-1 +save_best_every_sec=5 +save_best_metric=reward +save_best_after=100000 +benchmark=False +encoder_mlp_layers=[512, 512] +encoder_conv_architecture=convnet_simple +encoder_conv_mlp_layers=[512] +use_rnn=True +rnn_size=512 +rnn_type=gru +rnn_num_layers=1 +decoder_mlp_layers=[] +nonlinearity=elu +policy_initialization=orthogonal +policy_init_gain=1.0 +actor_critic_share_weights=True +adaptive_stddev=True +continuous_tanh_scale=0.0 +initial_stddev=1.0 +use_env_info_cache=False +env_gpu_actions=False +env_gpu_observations=True +env_frameskip=4 +env_framestack=1 +pixel_format=CHW +use_record_episode_statistics=False +with_wandb=False +wandb_user=None +wandb_project=sample_factory +wandb_group=None +wandb_job_type=SF +wandb_tags=[] +with_pbt=False +pbt_mix_policies_in_one_env=True +pbt_period_env_steps=5000000 +pbt_start_mutation=20000000 +pbt_replace_fraction=0.3 +pbt_mutation_rate=0.15 +pbt_replace_reward_gap=0.1 +pbt_replace_reward_gap_absolute=1e-06 +pbt_optimize_gamma=False +pbt_target_objective=true_objective +pbt_perturb_min=1.1 +pbt_perturb_max=1.5 +num_agents=-1 +num_humans=0 +num_bots=-1 +start_bot_difficulty=None +timelimit=None +res_w=128 +res_h=72 +wide_aspect_ratio=False +eval_env_frameskip=1 +fps=35 +command_line=--env=doom_dm --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=20000000 +cli_args={'env': 'doom_dm', 'num_workers': 8, 'num_envs_per_worker': 4, 'train_for_env_steps': 20000000} +git_hash=20b6d44612dad7d171f23e13b1f3b4c5e5631cf9 +git_repo_name=https://github.com/MattStammers/optuna.git +[2023-09-14 11:59:18,351][97397] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json... +[2023-09-14 11:59:18,519][97397] Rollout worker 0 uses device cpu +[2023-09-14 11:59:18,521][97397] Rollout worker 1 uses device cpu +[2023-09-14 11:59:18,523][97397] Rollout worker 2 uses device cpu +[2023-09-14 11:59:18,524][97397] Rollout worker 3 uses device cpu +[2023-09-14 11:59:18,524][97397] Rollout worker 4 uses device cpu +[2023-09-14 11:59:18,525][97397] Rollout worker 5 uses device cpu +[2023-09-14 11:59:18,526][97397] Rollout worker 6 uses device cpu +[2023-09-14 11:59:18,527][97397] Rollout worker 7 uses device cpu +[2023-09-14 11:59:18,700][97397] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 11:59:18,700][97397] InferenceWorker_p0-w0: min num requests: 2 +[2023-09-14 11:59:18,727][97397] Starting all processes... +[2023-09-14 11:59:18,728][97397] Starting process learner_proc0 +[2023-09-14 11:59:20,281][97397] Starting all processes... +[2023-09-14 11:59:20,283][82394] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 11:59:20,283][82394] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 +[2023-09-14 11:59:20,287][97397] Starting process inference_proc0-0 +[2023-09-14 11:59:20,288][97397] Starting process rollout_proc0 +[2023-09-14 11:59:20,289][97397] Starting process rollout_proc1 +[2023-09-14 11:59:20,289][97397] Starting process rollout_proc2 +[2023-09-14 11:59:20,290][97397] Starting process rollout_proc3 +[2023-09-14 11:59:20,290][97397] Starting process rollout_proc4 +[2023-09-14 11:59:20,325][82394] Num visible devices: 1 +[2023-09-14 11:59:20,291][97397] Starting process rollout_proc5 +[2023-09-14 11:59:20,291][97397] Starting process rollout_proc6 +[2023-09-14 11:59:20,292][97397] Starting process rollout_proc7 +[2023-09-14 11:59:20,372][82394] Starting seed is not provided +[2023-09-14 11:59:20,372][82394] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 11:59:20,372][82394] Initializing actor-critic model on device cuda:0 +[2023-09-14 11:59:20,372][82394] RunningMeanStd input shape: (23,) +[2023-09-14 11:59:20,373][82394] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 11:59:20,373][82394] RunningMeanStd input shape: (1,) +[2023-09-14 11:59:20,398][82394] ConvEncoder: input_channels=3 +[2023-09-14 11:59:20,572][82394] Conv encoder output size: 512 +[2023-09-14 11:59:20,573][82394] Policy head output size: 640 +[2023-09-14 11:59:20,591][82394] Created Actor Critic model with architecture: +[2023-09-14 11:59:20,591][82394] ActorCriticSharedWeights( + (obs_normalizer): ObservationNormalizer( + (running_mean_std): RunningMeanStdDictInPlace( + (running_mean_std): ModuleDict( + (measurements): RunningMeanStdInPlace() + (obs): RunningMeanStdInPlace() + ) + ) + ) + (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) + (encoder): VizdoomEncoder( + (basic_encoder): ConvEncoder( + (enc): RecursiveScriptModule( + original_name=ConvEncoderImpl + (conv_head): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Conv2d) + (1): RecursiveScriptModule(original_name=ELU) + (2): RecursiveScriptModule(original_name=Conv2d) + (3): RecursiveScriptModule(original_name=ELU) + (4): RecursiveScriptModule(original_name=Conv2d) + (5): RecursiveScriptModule(original_name=ELU) + ) + (mlp_layers): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Linear) + (1): RecursiveScriptModule(original_name=ELU) + ) + ) + ) + (measurements_head): Sequential( + (0): Linear(in_features=23, out_features=128, bias=True) + (1): ELU(alpha=1.0) + (2): Linear(in_features=128, out_features=128, bias=True) + (3): ELU(alpha=1.0) + ) + ) + (core): ModelCoreRNN( + (core): GRU(640, 512) + ) + (decoder): MlpDecoder( + (mlp): Identity() + ) + (critic_linear): Linear(in_features=512, out_features=1, bias=True) + (action_parameterization): ActionParameterizationDefault( + (distribution_linear): Linear(in_features=512, out_features=15, bias=True) + ) +) +[2023-09-14 11:59:21,707][82394] Using optimizer +[2023-09-14 11:59:21,708][82394] No checkpoints found +[2023-09-14 11:59:21,708][82394] Did not load from checkpoint, starting from scratch! +[2023-09-14 11:59:21,709][82394] Initialized policy 0 weights for model version 0 +[2023-09-14 11:59:21,711][82394] LearnerWorker_p0 finished initialization! +[2023-09-14 11:59:21,711][82394] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 11:59:22,358][82479] Worker 3 uses CPU cores [12, 13, 14, 15] +[2023-09-14 11:59:22,364][82512] Worker 4 uses CPU cores [16, 17, 18, 19] +[2023-09-14 11:59:22,456][82477] Worker 1 uses CPU cores [4, 5, 6, 7] +[2023-09-14 11:59:22,495][82475] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 11:59:22,495][82475] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 +[2023-09-14 11:59:22,513][82475] Num visible devices: 1 +[2023-09-14 11:59:22,527][82514] Worker 6 uses CPU cores [24, 25, 26, 27] +[2023-09-14 11:59:22,593][82476] Worker 0 uses CPU cores [0, 1, 2, 3] +[2023-09-14 11:59:22,683][82480] Worker 5 uses CPU cores [20, 21, 22, 23] +[2023-09-14 11:59:22,709][82478] Worker 2 uses CPU cores [8, 9, 10, 11] +[2023-09-14 11:59:22,789][82513] Worker 7 uses CPU cores [28, 29, 30, 31] +[2023-09-14 11:59:22,789][97397] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 0. Throughput: 0: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:59:23,131][82475] RunningMeanStd input shape: (23,) +[2023-09-14 11:59:23,132][82475] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 11:59:23,132][82475] RunningMeanStd input shape: (1,) +[2023-09-14 11:59:23,144][82475] ConvEncoder: input_channels=3 +[2023-09-14 11:59:23,245][82475] Conv encoder output size: 512 +[2023-09-14 11:59:23,246][82475] Policy head output size: 640 +[2023-09-14 11:59:23,524][97397] Inference worker 0-0 is ready! +[2023-09-14 11:59:23,526][97397] All inference workers are ready! Signal rollout workers to start! +[2023-09-14 11:59:23,530][82512] Multi agent env, num agents: 8 +[2023-09-14 11:59:23,531][82476] Multi agent env, num agents: 8 +[2023-09-14 11:59:23,532][82478] Multi agent env, num agents: 8 +[2023-09-14 11:59:23,532][82477] Multi agent env, num agents: 8 +[2023-09-14 11:59:23,532][82479] Multi agent env, num agents: 8 +[2023-09-14 11:59:23,532][82513] Multi agent env, num agents: 8 +[2023-09-14 11:59:23,532][82514] Multi agent env, num agents: 8 +[2023-09-14 11:59:23,533][82480] Multi agent env, num agents: 8 +[2023-09-14 11:59:23,560][82512] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:59:23,563][82512] Multi agent env, num agents: 8 +[2023-09-14 11:59:23,566][82478] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:59:23,566][82479] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:59:23,566][82476] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:59:23,567][82513] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:59:23,567][82514] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:59:23,568][82480] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:59:23,569][82479] Multi agent env, num agents: 8 +[2023-09-14 11:59:23,570][82478] Multi agent env, num agents: 8 +[2023-09-14 11:59:23,570][82513] Multi agent env, num agents: 8 +[2023-09-14 11:59:23,570][82476] Multi agent env, num agents: 8 +[2023-09-14 11:59:23,570][82514] Multi agent env, num agents: 8 +[2023-09-14 11:59:23,572][82480] Multi agent env, num agents: 8 +[2023-09-14 11:59:23,572][82477] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:59:23,576][82477] Multi agent env, num agents: 8 +[2023-09-14 11:59:23,593][82512] Port 40700 is available +[2023-09-14 11:59:23,593][82512] Using port 40700 +[2023-09-14 11:59:23,595][82512] Initializing env for player 0, init_info: {'port': 40700}... +[2023-09-14 11:59:23,600][82513] Port 41000 is available +[2023-09-14 11:59:23,600][82479] Port 40600 is available +[2023-09-14 11:59:23,600][82513] Using port 41000 +[2023-09-14 11:59:23,600][82479] Using port 40600 +[2023-09-14 11:59:23,601][82478] Port 40500 is available +[2023-09-14 11:59:23,601][82478] Using port 40500 +[2023-09-14 11:59:23,601][82479] Initializing env for player 0, init_info: {'port': 40600}... +[2023-09-14 11:59:23,601][82513] Initializing env for player 0, init_info: {'port': 41000}... +[2023-09-14 11:59:23,602][82514] Port 40900 is available +[2023-09-14 11:59:23,602][82514] Using port 40900 +[2023-09-14 11:59:23,602][82480] Port 40800 is available +[2023-09-14 11:59:23,602][82478] Initializing env for player 0, init_info: {'port': 40500}... +[2023-09-14 11:59:23,603][82480] Using port 40800 +[2023-09-14 11:59:23,603][82514] Initializing env for player 0, init_info: {'port': 40900}... +[2023-09-14 11:59:23,603][82476] Port 40300 is available +[2023-09-14 11:59:23,604][82476] Using port 40300 +[2023-09-14 11:59:23,604][82480] Initializing env for player 0, init_info: {'port': 40800}... +[2023-09-14 11:59:23,607][82477] Port 40400 is available +[2023-09-14 11:59:23,607][82477] Using port 40400 +[2023-09-14 11:59:23,608][82477] Initializing env for player 0, init_info: {'port': 40400}... +[2023-09-14 11:59:23,630][82512] Using port 40700 on host... +[2023-09-14 11:59:23,633][82480] Using port 40800 on host... +[2023-09-14 11:59:23,636][82479] Using port 40600 on host... +[2023-09-14 11:59:23,637][82513] Using port 41000 on host... +[2023-09-14 11:59:23,644][82477] Using port 40400 on host... +[2023-09-14 11:59:23,645][82512] Initializing env for player 1, init_info: {'port': 40700}... +[2023-09-14 11:59:23,652][82479] Initializing env for player 1, init_info: {'port': 40600}... +[2023-09-14 11:59:23,652][82513] Initializing env for player 1, init_info: {'port': 41000}... +[2023-09-14 11:59:23,653][82478] Initializing env for player 1, init_info: {'port': 40500}... +[2023-09-14 11:59:23,653][82514] Initializing env for player 1, init_info: {'port': 40900}... +[2023-09-14 11:59:23,654][82480] Initializing env for player 1, init_info: {'port': 40800}... +[2023-09-14 11:59:23,656][82478] Using port 40500 on host... +[2023-09-14 11:59:23,656][82514] Using port 40900 on host... +[2023-09-14 11:59:23,659][82477] Initializing env for player 1, init_info: {'port': 40400}... +[2023-09-14 11:59:23,696][82512] Initializing env for player 2, init_info: {'port': 40700}... +[2023-09-14 11:59:23,702][82479] Initializing env for player 2, init_info: {'port': 40600}... +[2023-09-14 11:59:23,703][82513] Initializing env for player 2, init_info: {'port': 41000}... +[2023-09-14 11:59:23,703][82478] Initializing env for player 2, init_info: {'port': 40500}... +[2023-09-14 11:59:23,704][82514] Initializing env for player 2, init_info: {'port': 40900}... +[2023-09-14 11:59:23,707][82480] Initializing env for player 2, init_info: {'port': 40800}... +[2023-09-14 11:59:23,711][82477] Initializing env for player 2, init_info: {'port': 40400}... +[2023-09-14 11:59:23,747][82512] Initializing env for player 3, init_info: {'port': 40700}... +[2023-09-14 11:59:23,755][82513] Initializing env for player 3, init_info: {'port': 41000}... +[2023-09-14 11:59:23,755][82479] Initializing env for player 3, init_info: {'port': 40600}... +[2023-09-14 11:59:23,757][82514] Initializing env for player 3, init_info: {'port': 40900}... +[2023-09-14 11:59:23,759][82478] Initializing env for player 3, init_info: {'port': 40500}... +[2023-09-14 11:59:23,763][82480] Initializing env for player 3, init_info: {'port': 40800}... +[2023-09-14 11:59:23,767][82477] Initializing env for player 3, init_info: {'port': 40400}... +[2023-09-14 11:59:23,798][82512] Initializing env for player 4, init_info: {'port': 40700}... +[2023-09-14 11:59:23,805][82513] Initializing env for player 4, init_info: {'port': 41000}... +[2023-09-14 11:59:23,807][82479] Initializing env for player 4, init_info: {'port': 40600}... +[2023-09-14 11:59:23,808][82478] Initializing env for player 4, init_info: {'port': 40500}... +[2023-09-14 11:59:23,811][82480] Initializing env for player 4, init_info: {'port': 40800}... +[2023-09-14 11:59:23,814][82514] Initializing env for player 4, init_info: {'port': 40900}... +[2023-09-14 11:59:23,821][82477] Initializing env for player 4, init_info: {'port': 40400}... +[2023-09-14 11:59:23,855][82512] Initializing env for player 5, init_info: {'port': 40700}... +[2023-09-14 11:59:23,856][82479] Initializing env for player 5, init_info: {'port': 40600}... +[2023-09-14 11:59:23,859][82513] Initializing env for player 5, init_info: {'port': 41000}... +[2023-09-14 11:59:23,863][82478] Initializing env for player 5, init_info: {'port': 40500}... +[2023-09-14 11:59:23,871][82480] Initializing env for player 5, init_info: {'port': 40800}... +[2023-09-14 11:59:23,875][82477] Initializing env for player 5, init_info: {'port': 40400}... +[2023-09-14 11:59:23,875][82514] Initializing env for player 5, init_info: {'port': 40900}... +[2023-09-14 11:59:23,907][82512] Initializing env for player 6, init_info: {'port': 40700}... +[2023-09-14 11:59:23,910][82513] Initializing env for player 6, init_info: {'port': 41000}... +[2023-09-14 11:59:23,911][82479] Initializing env for player 6, init_info: {'port': 40600}... +[2023-09-14 11:59:23,915][82478] Initializing env for player 6, init_info: {'port': 40500}... +[2023-09-14 11:59:23,923][82480] Initializing env for player 6, init_info: {'port': 40800}... +[2023-09-14 11:59:23,925][82477] Initializing env for player 6, init_info: {'port': 40400}... +[2023-09-14 11:59:23,935][82514] Initializing env for player 6, init_info: {'port': 40900}... +[2023-09-14 11:59:23,966][82479] Initializing env for player 7, init_info: {'port': 40600}... +[2023-09-14 11:59:23,967][82512] Initializing env for player 7, init_info: {'port': 40700}... +[2023-09-14 11:59:23,967][82513] Initializing env for player 7, init_info: {'port': 41000}... +[2023-09-14 11:59:23,967][82478] Initializing env for player 7, init_info: {'port': 40500}... +[2023-09-14 11:59:23,973][82480] Initializing env for player 7, init_info: {'port': 40800}... +[2023-09-14 11:59:23,981][82477] Initializing env for player 7, init_info: {'port': 40400}... +[2023-09-14 11:59:23,985][82514] Initializing env for player 7, init_info: {'port': 40900}... +[2023-09-14 11:59:25,377][82512] Initialized w:4 v:0 player:0 +[2023-09-14 11:59:25,378][82512] Initialized w:4 v:0 player:3 +[2023-09-14 11:59:25,380][82512] Initialized w:4 v:0 player:6 +[2023-09-14 11:59:25,381][82512] Initialized w:4 v:0 player:5 +[2023-09-14 11:59:25,381][82512] Initialized w:4 v:0 player:7 +[2023-09-14 11:59:25,381][82512] Initialized w:4 v:0 player:4 +[2023-09-14 11:59:25,381][82512] Initialized w:4 v:0 player:2 +[2023-09-14 11:59:25,381][82512] Initialized w:4 v:0 player:1 +[2023-09-14 11:59:25,383][82512] 8 agent workers initialized for env 4! +[2023-09-14 11:59:25,436][82512] Decorrelating experience for 0 frames... +[2023-09-14 11:59:25,437][82512] Port 40701 is available +[2023-09-14 11:59:25,438][82512] Using port 40701 +[2023-09-14 11:59:25,518][82478] Initialized w:2 v:0 player:6 +[2023-09-14 11:59:25,522][82478] Initialized w:2 v:0 player:3 +[2023-09-14 11:59:25,522][82478] Initialized w:2 v:0 player:7 +[2023-09-14 11:59:25,522][82478] Initialized w:2 v:0 player:5 +[2023-09-14 11:59:25,522][82478] Initialized w:2 v:0 player:2 +[2023-09-14 11:59:25,522][82478] Initialized w:2 v:0 player:4 +[2023-09-14 11:59:25,523][82478] Initialized w:2 v:0 player:1 +[2023-09-14 11:59:25,523][82478] Initialized w:2 v:0 player:0 +[2023-09-14 11:59:25,525][82478] 8 agent workers initialized for env 2! +[2023-09-14 11:59:25,563][82513] Initialized w:7 v:0 player:3 +[2023-09-14 11:59:25,564][82513] Initialized w:7 v:0 player:7 +[2023-09-14 11:59:25,564][82513] Initialized w:7 v:0 player:6 +[2023-09-14 11:59:25,565][82513] Initialized w:7 v:0 player:4 +[2023-09-14 11:59:25,566][82513] Initialized w:7 v:0 player:1 +[2023-09-14 11:59:25,566][82513] Initialized w:7 v:0 player:2 +[2023-09-14 11:59:25,566][82513] Initialized w:7 v:0 player:0 +[2023-09-14 11:59:25,569][82513] Initialized w:7 v:0 player:5 +[2023-09-14 11:59:25,569][82513] 8 agent workers initialized for env 7! +[2023-09-14 11:59:25,581][82478] Decorrelating experience for 0 frames... +[2023-09-14 11:59:25,583][82478] Port 40501 is available +[2023-09-14 11:59:25,584][82478] Using port 40501 +[2023-09-14 11:59:25,584][82478] Initializing env for player 0, init_info: {'port': 40501}... +[2023-09-14 11:59:25,598][82514] Initialized w:6 v:0 player:2 +[2023-09-14 11:59:25,598][82514] Initialized w:6 v:0 player:3 +[2023-09-14 11:59:25,599][82514] Initialized w:6 v:0 player:4 +[2023-09-14 11:59:25,599][82514] Initialized w:6 v:0 player:6 +[2023-09-14 11:59:25,600][82514] Initialized w:6 v:0 player:1 +[2023-09-14 11:59:25,600][82514] Initialized w:6 v:0 player:5 +[2023-09-14 11:59:25,600][82514] Initialized w:6 v:0 player:7 +[2023-09-14 11:59:25,601][82514] Initialized w:6 v:0 player:0 +[2023-09-14 11:59:25,602][82514] 8 agent workers initialized for env 6! +[2023-09-14 11:59:25,625][82476] Initializing env for player 0, init_info: {'port': 40300}... +[2023-09-14 11:59:25,628][82478] Using port 40501 on host... +[2023-09-14 11:59:25,631][82514] Decorrelating experience for 0 frames... +[2023-09-14 11:59:25,632][82514] Port 40901 is available +[2023-09-14 11:59:25,632][82514] Using port 40901 +[2023-09-14 11:59:25,634][82514] Initializing env for player 0, init_info: {'port': 40901}... +[2023-09-14 11:59:25,635][82478] Initializing env for player 1, init_info: {'port': 40501}... +[2023-09-14 11:59:25,637][82513] Decorrelating experience for 0 frames... +[2023-09-14 11:59:25,639][82513] Port 41001 is available +[2023-09-14 11:59:25,639][82513] Using port 41001 +[2023-09-14 11:59:25,640][82513] Initializing env for player 0, init_info: {'port': 41001}... +[2023-09-14 11:59:25,646][82477] Initialized w:1 v:0 player:7 +[2023-09-14 11:59:25,652][82477] Initialized w:1 v:0 player:1 +[2023-09-14 11:59:25,653][82477] Initialized w:1 v:0 player:2 +[2023-09-14 11:59:25,653][82477] Initialized w:1 v:0 player:4 +[2023-09-14 11:59:25,653][82477] Initialized w:1 v:0 player:0 +[2023-09-14 11:59:25,653][82477] Initialized w:1 v:0 player:6 +[2023-09-14 11:59:25,654][82477] Initialized w:1 v:0 player:5 +[2023-09-14 11:59:25,655][82476] Using port 40300 on host... +[2023-09-14 11:59:25,657][82480] Initialized w:5 v:0 player:0 +[2023-09-14 11:59:25,659][82480] Initialized w:5 v:0 player:5 +[2023-09-14 11:59:25,661][82480] Initialized w:5 v:0 player:4 +[2023-09-14 11:59:25,662][82480] Initialized w:5 v:0 player:1 +[2023-09-14 11:59:25,662][82480] Initialized w:5 v:0 player:7 +[2023-09-14 11:59:25,663][82480] Initialized w:5 v:0 player:6 +[2023-09-14 11:59:25,667][82480] Initialized w:5 v:0 player:3 +[2023-09-14 11:59:25,667][82480] Initialized w:5 v:0 player:2 +[2023-09-14 11:59:25,669][82480] 8 agent workers initialized for env 5! +[2023-09-14 11:59:25,679][82476] Initializing env for player 1, init_info: {'port': 40300}... +[2023-09-14 11:59:25,679][82514] Using port 40901 on host... +[2023-09-14 11:59:25,684][82513] Using port 41001 on host... +[2023-09-14 11:59:25,685][82479] Initialized w:3 v:0 player:4 +[2023-09-14 11:59:25,687][82479] Initialized w:3 v:0 player:1 +[2023-09-14 11:59:25,687][82479] Initialized w:3 v:0 player:7 +[2023-09-14 11:59:25,688][82514] Initializing env for player 1, init_info: {'port': 40901}... +[2023-09-14 11:59:25,687][82479] Initialized w:3 v:0 player:3 +[2023-09-14 11:59:25,687][82479] Initialized w:3 v:0 player:0 +[2023-09-14 11:59:25,687][82479] Initialized w:3 v:0 player:2 +[2023-09-14 11:59:25,688][82479] Initialized w:3 v:0 player:6 +[2023-09-14 11:59:25,688][82479] Initialized w:3 v:0 player:5 +[2023-09-14 11:59:25,691][82479] 8 agent workers initialized for env 3! +[2023-09-14 11:59:25,692][82478] Initializing env for player 2, init_info: {'port': 40501}... +[2023-09-14 11:59:25,696][82513] Initializing env for player 1, init_info: {'port': 41001}... +[2023-09-14 11:59:25,731][82476] Initializing env for player 2, init_info: {'port': 40300}... +[2023-09-14 11:59:25,736][82479] Decorrelating experience for 0 frames... +[2023-09-14 11:59:25,737][82480] Decorrelating experience for 0 frames... +[2023-09-14 11:59:25,738][82479] Port 40601 is available +[2023-09-14 11:59:25,738][82479] Using port 40601 +[2023-09-14 11:59:25,739][82479] Initializing env for player 0, init_info: {'port': 40601}... +[2023-09-14 11:59:25,739][82480] Port 40801 is available +[2023-09-14 11:59:25,739][82480] Using port 40801 +[2023-09-14 11:59:25,740][82480] Initializing env for player 0, init_info: {'port': 40801}... +[2023-09-14 11:59:25,741][82512] Initializing env for player 0, init_info: {'port': 40701}... +[2023-09-14 11:59:25,747][82478] Initializing env for player 3, init_info: {'port': 40501}... +[2023-09-14 11:59:25,748][82514] Initializing env for player 2, init_info: {'port': 40901}... +[2023-09-14 11:59:25,755][82513] Initializing env for player 2, init_info: {'port': 41001}... +[2023-09-14 11:59:25,770][82480] Using port 40801 on host... +[2023-09-14 11:59:25,771][82512] Using port 40701 on host... +[2023-09-14 11:59:25,779][82479] Using port 40601 on host... +[2023-09-14 11:59:25,779][82476] Initializing env for player 3, init_info: {'port': 40300}... +[2023-09-14 11:59:25,789][82479] Initializing env for player 1, init_info: {'port': 40601}... +[2023-09-14 11:59:25,790][82480] Initializing env for player 1, init_info: {'port': 40801}... +[2023-09-14 11:59:25,792][82512] Initializing env for player 1, init_info: {'port': 40701}... +[2023-09-14 11:59:25,797][82478] Initializing env for player 4, init_info: {'port': 40501}... +[2023-09-14 11:59:25,798][82514] Initializing env for player 3, init_info: {'port': 40901}... +[2023-09-14 11:59:25,835][82476] Initializing env for player 4, init_info: {'port': 40300}... +[2023-09-14 11:59:25,846][82480] Initializing env for player 2, init_info: {'port': 40801}... +[2023-09-14 11:59:25,846][82479] Initializing env for player 2, init_info: {'port': 40601}... +[2023-09-14 11:59:25,847][82512] Initializing env for player 2, init_info: {'port': 40701}... +[2023-09-14 11:59:25,851][82514] Initializing env for player 4, init_info: {'port': 40901}... +[2023-09-14 11:59:25,851][82478] Initializing env for player 5, init_info: {'port': 40501}... +[2023-09-14 11:59:25,860][82513] Initializing env for player 3, init_info: {'port': 41001}... +[2023-09-14 11:59:25,879][82513] Initializing env for player 4, init_info: {'port': 41001}... +[2023-09-14 11:59:25,886][82476] Initializing env for player 5, init_info: {'port': 40300}... +[2023-09-14 11:59:25,896][82480] Initializing env for player 3, init_info: {'port': 40801}... +[2023-09-14 11:59:25,898][82512] Initializing env for player 3, init_info: {'port': 40701}... +[2023-09-14 11:59:25,902][82514] Initializing env for player 5, init_info: {'port': 40901}... +[2023-09-14 11:59:25,905][82478] Initializing env for player 6, init_info: {'port': 40501}... +[2023-09-14 11:59:25,911][82479] Initializing env for player 3, init_info: {'port': 40601}... +[2023-09-14 11:59:25,927][82513] Initializing env for player 5, init_info: {'port': 41001}... +[2023-09-14 11:59:25,939][82476] Initializing env for player 6, init_info: {'port': 40300}... +[2023-09-14 11:59:25,951][82512] Initializing env for player 4, init_info: {'port': 40701}... +[2023-09-14 11:59:25,956][82480] Initializing env for player 4, init_info: {'port': 40801}... +[2023-09-14 11:59:25,958][82478] Initializing env for player 7, init_info: {'port': 40501}... +[2023-09-14 11:59:25,959][82514] Initializing env for player 6, init_info: {'port': 40901}... +[2023-09-14 11:59:25,963][82479] Initializing env for player 4, init_info: {'port': 40601}... +[2023-09-14 11:59:25,989][82476] Initializing env for player 7, init_info: {'port': 40300}... +[2023-09-14 11:59:26,007][82514] Initializing env for player 7, init_info: {'port': 40901}... +[2023-09-14 11:59:25,991][82513] Initializing env for player 6, init_info: {'port': 41001}... +[2023-09-14 11:59:26,006][82512] Initializing env for player 5, init_info: {'port': 40701}... +[2023-09-14 11:59:26,008][82480] Initializing env for player 5, init_info: {'port': 40801}... +[2023-09-14 11:59:26,030][82479] Initializing env for player 5, init_info: {'port': 40601}... +[2023-09-14 11:59:26,057][82512] Initializing env for player 6, init_info: {'port': 40701}... +[2023-09-14 11:59:26,061][82513] Initializing env for player 7, init_info: {'port': 41001}... +[2023-09-14 11:59:26,063][82480] Initializing env for player 6, init_info: {'port': 40801}... +[2023-09-14 11:59:26,075][82479] Initializing env for player 6, init_info: {'port': 40601}... +[2023-09-14 11:59:26,110][82512] Initializing env for player 7, init_info: {'port': 40701}... +[2023-09-14 11:59:26,122][82479] Initializing env for player 7, init_info: {'port': 40601}... +[2023-09-14 11:59:26,123][82480] Initializing env for player 7, init_info: {'port': 40801}... +[2023-09-14 11:59:26,363][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:59:27,558][82478] Initialized w:2 v:1 player:2 +[2023-09-14 11:59:27,559][82478] Initialized w:2 v:1 player:3 +[2023-09-14 11:59:27,560][82478] Initialized w:2 v:1 player:5 +[2023-09-14 11:59:27,560][82478] Initialized w:2 v:1 player:4 +[2023-09-14 11:59:27,560][82478] Initialized w:2 v:1 player:7 +[2023-09-14 11:59:27,561][82478] Initialized w:2 v:1 player:0 +[2023-09-14 11:59:27,561][82478] Initialized w:2 v:1 player:1 +[2023-09-14 11:59:27,562][82478] Initialized w:2 v:1 player:6 +[2023-09-14 11:59:27,563][82478] 8 agent workers initialized for env 2! +[2023-09-14 11:59:27,609][82478] Decorrelating experience for 32 frames... +[2023-09-14 11:59:27,631][82514] Initialized w:6 v:1 player:4 +[2023-09-14 11:59:27,631][82514] Initialized w:6 v:1 player:2 +[2023-09-14 11:59:27,632][82514] Initialized w:6 v:1 player:6 +[2023-09-14 11:59:27,633][82514] Initialized w:6 v:1 player:7 +[2023-09-14 11:59:27,635][82514] Initialized w:6 v:1 player:3 +[2023-09-14 11:59:27,635][82514] Initialized w:6 v:1 player:1 +[2023-09-14 11:59:27,635][82514] Initialized w:6 v:1 player:5 +[2023-09-14 11:59:27,636][82514] Initialized w:6 v:1 player:0 +[2023-09-14 11:59:27,637][82514] 8 agent workers initialized for env 6! +[2023-09-14 11:59:27,638][82480] Initialized w:5 v:1 player:5 +[2023-09-14 11:59:27,642][82480] Initialized w:5 v:1 player:7 +[2023-09-14 11:59:27,647][82480] Initialized w:5 v:1 player:6 +[2023-09-14 11:59:27,648][82480] Initialized w:5 v:1 player:4 +[2023-09-14 11:59:27,649][82480] Initialized w:5 v:1 player:1 +[2023-09-14 11:59:27,649][82480] Initialized w:5 v:1 player:3 +[2023-09-14 11:59:27,651][82480] Initialized w:5 v:1 player:2 +[2023-09-14 11:59:27,655][82513] Initialized w:7 v:1 player:4 +[2023-09-14 11:59:27,656][82480] Initialized w:5 v:1 player:0 +[2023-09-14 11:59:27,658][82480] 8 agent workers initialized for env 5! +[2023-09-14 11:59:27,659][82513] Initialized w:7 v:1 player:3 +[2023-09-14 11:59:27,660][82513] Initialized w:7 v:1 player:5 +[2023-09-14 11:59:27,660][82513] Initialized w:7 v:1 player:2 +[2023-09-14 11:59:27,661][82513] Initialized w:7 v:1 player:1 +[2023-09-14 11:59:27,662][82479] Initialized w:3 v:1 player:0 +[2023-09-14 11:59:27,663][82513] Initialized w:7 v:1 player:0 +[2023-09-14 11:59:27,664][82513] Initialized w:7 v:1 player:6 +[2023-09-14 11:59:27,664][82479] Initialized w:3 v:1 player:1 +[2023-09-14 11:59:27,665][82479] Initialized w:3 v:1 player:6 +[2023-09-14 11:59:27,665][82513] Initialized w:7 v:1 player:7 +[2023-09-14 11:59:27,665][82479] Initialized w:3 v:1 player:2 +[2023-09-14 11:59:27,665][82479] Initialized w:3 v:1 player:4 +[2023-09-14 11:59:27,666][82479] Initialized w:3 v:1 player:5 +[2023-09-14 11:59:27,666][82479] Initialized w:3 v:1 player:3 +[2023-09-14 11:59:27,667][82513] 8 agent workers initialized for env 7! +[2023-09-14 11:59:27,667][82479] Initialized w:3 v:1 player:7 +[2023-09-14 11:59:27,669][82479] 8 agent workers initialized for env 3! +[2023-09-14 11:59:27,669][82512] Initialized w:4 v:1 player:7 +[2023-09-14 11:59:27,671][82512] Initialized w:4 v:1 player:6 +[2023-09-14 11:59:27,672][82512] Initialized w:4 v:1 player:2 +[2023-09-14 11:59:27,673][82512] Initialized w:4 v:1 player:4 +[2023-09-14 11:59:27,673][82512] Initialized w:4 v:1 player:1 +[2023-09-14 11:59:27,674][82512] Initialized w:4 v:1 player:3 +[2023-09-14 11:59:27,674][82512] Initialized w:4 v:1 player:5 +[2023-09-14 11:59:27,675][82512] Initialized w:4 v:1 player:0 +[2023-09-14 11:59:27,676][82512] 8 agent workers initialized for env 4! +[2023-09-14 11:59:27,691][82514] Decorrelating experience for 32 frames... +[2023-09-14 11:59:27,707][82480] Decorrelating experience for 32 frames... +[2023-09-14 11:59:27,712][82479] Decorrelating experience for 32 frames... +[2023-09-14 11:59:27,756][82512] Decorrelating experience for 32 frames... +[2023-09-14 11:59:27,771][82513] Decorrelating experience for 32 frames... +[2023-09-14 11:59:27,787][82476] Initialized w:0 v:0 player:1 +[2023-09-14 11:59:27,789][82476] Initialized w:0 v:0 player:2 +[2023-09-14 11:59:27,790][82476] Initialized w:0 v:0 player:7 +[2023-09-14 11:59:27,790][82476] Initialized w:0 v:0 player:0 +[2023-09-14 11:59:27,790][82476] Initialized w:0 v:0 player:4 +[2023-09-14 11:59:27,791][82476] Initialized w:0 v:0 player:3 +[2023-09-14 11:59:27,792][82476] Initialized w:0 v:0 player:5 +[2023-09-14 11:59:27,793][82476] Initialized w:0 v:0 player:6 +[2023-09-14 11:59:27,794][82476] 8 agent workers initialized for env 0! +[2023-09-14 11:59:27,835][82476] Decorrelating experience for 0 frames... +[2023-09-14 11:59:27,837][82476] Port 40301 is available +[2023-09-14 11:59:27,837][82476] Using port 40301 +[2023-09-14 11:59:27,838][82476] Initializing env for player 0, init_info: {'port': 40301}... +[2023-09-14 11:59:27,884][82476] Using port 40301 on host... +[2023-09-14 11:59:27,893][82476] Initializing env for player 1, init_info: {'port': 40301}... +[2023-09-14 11:59:27,948][82476] Initializing env for player 2, init_info: {'port': 40301}... +[2023-09-14 11:59:27,999][82476] Initializing env for player 3, init_info: {'port': 40301}... +[2023-09-14 11:59:28,049][82476] Initializing env for player 4, init_info: {'port': 40301}... +[2023-09-14 11:59:28,077][82478] Multi agent env, num agents: 8 +[2023-09-14 11:59:28,094][82514] Multi agent env, num agents: 8 +[2023-09-14 11:59:28,110][82478] Multi agent env, num agents: 8 +[2023-09-14 11:59:28,119][82476] Initializing env for player 5, init_info: {'port': 40301}... +[2023-09-14 11:59:28,122][82479] Multi agent env, num agents: 8 +[2023-09-14 11:59:28,125][82514] Multi agent env, num agents: 8 +[2023-09-14 11:59:28,140][82478] Port 40502 is available +[2023-09-14 11:59:28,140][82478] Using port 40502 +[2023-09-14 11:59:28,141][82478] Initializing env for player 0, init_info: {'port': 40502}... +[2023-09-14 11:59:28,148][82480] Multi agent env, num agents: 8 +[2023-09-14 11:59:28,157][82514] Port 40902 is available +[2023-09-14 11:59:28,157][82514] Using port 40902 +[2023-09-14 11:59:28,158][82514] Initializing env for player 0, init_info: {'port': 40902}... +[2023-09-14 11:59:28,162][82479] Multi agent env, num agents: 8 +[2023-09-14 11:59:28,170][82478] Using port 40502 on host... +[2023-09-14 11:59:28,171][82476] Initializing env for player 6, init_info: {'port': 40301}... +[2023-09-14 11:59:28,179][82480] Multi agent env, num agents: 8 +[2023-09-14 11:59:28,188][82514] Using port 40902 on host... +[2023-09-14 11:59:28,191][82478] Initializing env for player 1, init_info: {'port': 40502}... +[2023-09-14 11:59:28,203][82479] Port 40602 is available +[2023-09-14 11:59:28,204][82479] Using port 40602 +[2023-09-14 11:59:28,208][82514] Initializing env for player 1, init_info: {'port': 40902}... +[2023-09-14 11:59:28,210][82480] Port 40802 is available +[2023-09-14 11:59:28,210][82480] Using port 40802 +[2023-09-14 11:59:28,211][82480] Initializing env for player 0, init_info: {'port': 40802}... +[2023-09-14 11:59:28,213][82513] Multi agent env, num agents: 8 +[2023-09-14 11:59:28,215][82512] Multi agent env, num agents: 8 +[2023-09-14 11:59:28,223][82476] Initializing env for player 7, init_info: {'port': 40301}... +[2023-09-14 11:59:28,241][82480] Using port 40802 on host... +[2023-09-14 11:59:28,242][82478] Initializing env for player 2, init_info: {'port': 40502}... +[2023-09-14 11:59:28,244][82513] Multi agent env, num agents: 8 +[2023-09-14 11:59:28,262][82512] Multi agent env, num agents: 8 +[2023-09-14 11:59:28,263][82480] Initializing env for player 1, init_info: {'port': 40802}... +[2023-09-14 11:59:28,267][82514] Initializing env for player 2, init_info: {'port': 40902}... +[2023-09-14 11:59:28,292][82478] Initializing env for player 3, init_info: {'port': 40502}... +[2023-09-14 11:59:28,313][82480] Initializing env for player 2, init_info: {'port': 40802}... +[2023-09-14 11:59:28,319][82514] Initializing env for player 3, init_info: {'port': 40902}... +[2023-09-14 11:59:28,331][82512] Port 40702 is available +[2023-09-14 11:59:28,333][82512] Using port 40702 +[2023-09-14 11:59:28,347][82513] Port 41002 is available +[2023-09-14 11:59:28,347][82513] Using port 41002 +[2023-09-14 11:59:28,348][82513] Initializing env for player 0, init_info: {'port': 41002}... +[2023-09-14 11:59:28,355][82478] Initializing env for player 4, init_info: {'port': 40502}... +[2023-09-14 11:59:28,367][82514] Initializing env for player 4, init_info: {'port': 40902}... +[2023-09-14 11:59:28,371][82480] Initializing env for player 3, init_info: {'port': 40802}... +[2023-09-14 11:59:28,377][82513] Using port 41002 on host... +[2023-09-14 11:59:28,399][82513] Initializing env for player 1, init_info: {'port': 41002}... +[2023-09-14 11:59:28,407][82478] Initializing env for player 5, init_info: {'port': 40502}... +[2023-09-14 11:59:28,423][82514] Initializing env for player 5, init_info: {'port': 40902}... +[2023-09-14 11:59:28,427][82480] Initializing env for player 4, init_info: {'port': 40802}... +[2023-09-14 11:59:28,449][82513] Initializing env for player 2, init_info: {'port': 41002}... +[2023-09-14 11:59:28,463][82478] Initializing env for player 6, init_info: {'port': 40502}... +[2023-09-14 11:59:28,475][82514] Initializing env for player 6, init_info: {'port': 40902}... +[2023-09-14 11:59:28,491][82480] Initializing env for player 5, init_info: {'port': 40802}... +[2023-09-14 11:59:28,499][82513] Initializing env for player 3, init_info: {'port': 41002}... +[2023-09-14 11:59:28,515][82478] Initializing env for player 7, init_info: {'port': 40502}... +[2023-09-14 11:59:28,527][82514] Initializing env for player 7, init_info: {'port': 40902}... +[2023-09-14 11:59:28,550][82513] Initializing env for player 4, init_info: {'port': 41002}... +[2023-09-14 11:59:28,551][82480] Initializing env for player 6, init_info: {'port': 40802}... +[2023-09-14 11:59:28,611][82480] Initializing env for player 7, init_info: {'port': 40802}... +[2023-09-14 11:59:28,612][82513] Initializing env for player 5, init_info: {'port': 41002}... +[2023-09-14 11:59:28,659][82513] Initializing env for player 6, init_info: {'port': 41002}... +[2023-09-14 11:59:28,711][82513] Initializing env for player 7, init_info: {'port': 41002}... +[2023-09-14 11:59:29,709][82476] Initialized w:0 v:1 player:0 +[2023-09-14 11:59:29,711][82476] Initialized w:0 v:1 player:6 +[2023-09-14 11:59:29,712][82476] Initialized w:0 v:1 player:5 +[2023-09-14 11:59:29,712][82476] Initialized w:0 v:1 player:2 +[2023-09-14 11:59:29,713][82476] Initialized w:0 v:1 player:1 +[2023-09-14 11:59:29,713][82476] Initialized w:0 v:1 player:7 +[2023-09-14 11:59:29,713][82476] Initialized w:0 v:1 player:4 +[2023-09-14 11:59:29,713][82476] Initialized w:0 v:1 player:3 +[2023-09-14 11:59:29,715][82476] 8 agent workers initialized for env 0! +[2023-09-14 11:59:29,772][82476] Decorrelating experience for 32 frames... +[2023-09-14 11:59:29,951][82514] Initialized w:6 v:2 player:1 +[2023-09-14 11:59:29,953][82514] Initialized w:6 v:2 player:3 +[2023-09-14 11:59:29,953][82514] Initialized w:6 v:2 player:6 +[2023-09-14 11:59:29,953][82514] Initialized w:6 v:2 player:4 +[2023-09-14 11:59:29,953][82514] Initialized w:6 v:2 player:2 +[2023-09-14 11:59:29,956][82478] Initialized w:2 v:2 player:6 +[2023-09-14 11:59:29,954][82514] Initialized w:6 v:2 player:7 +[2023-09-14 11:59:29,956][82514] Initialized w:6 v:2 player:5 +[2023-09-14 11:59:29,957][82478] Initialized w:2 v:2 player:1 +[2023-09-14 11:59:29,957][82514] Initialized w:6 v:2 player:0 +[2023-09-14 11:59:29,958][82478] Initialized w:2 v:2 player:5 +[2023-09-14 11:59:29,958][82478] Initialized w:2 v:2 player:0 +[2023-09-14 11:59:29,958][82478] Initialized w:2 v:2 player:7 +[2023-09-14 11:59:29,959][82514] 8 agent workers initialized for env 6! +[2023-09-14 11:59:29,958][82478] Initialized w:2 v:2 player:2 +[2023-09-14 11:59:29,959][82480] Initialized w:5 v:2 player:3 +[2023-09-14 11:59:29,959][82478] Initialized w:2 v:2 player:3 +[2023-09-14 11:59:29,959][82478] Initialized w:2 v:2 player:4 +[2023-09-14 11:59:29,960][82480] Initialized w:5 v:2 player:5 +[2023-09-14 11:59:29,961][82478] 8 agent workers initialized for env 2! +[2023-09-14 11:59:29,961][82480] Initialized w:5 v:2 player:2 +[2023-09-14 11:59:29,961][82480] Initialized w:5 v:2 player:4 +[2023-09-14 11:59:29,962][82480] Initialized w:5 v:2 player:7 +[2023-09-14 11:59:29,962][82480] Initialized w:5 v:2 player:6 +[2023-09-14 11:59:29,962][82480] Initialized w:5 v:2 player:1 +[2023-09-14 11:59:29,962][82480] Initialized w:5 v:2 player:0 +[2023-09-14 11:59:29,964][82480] 8 agent workers initialized for env 5! +[2023-09-14 11:59:29,970][82479] Initializing env for player 0, init_info: {'port': 40602}... +[2023-09-14 11:59:29,989][82478] Decorrelating experience for 64 frames... +[2023-09-14 11:59:30,001][82512] Initializing env for player 0, init_info: {'port': 40702}... +[2023-09-14 11:59:30,012][82480] Decorrelating experience for 64 frames... +[2023-09-14 11:59:30,015][82479] Using port 40602 on host... +[2023-09-14 11:59:30,026][82479] Initializing env for player 1, init_info: {'port': 40602}... +[2023-09-14 11:59:30,030][82514] Decorrelating experience for 64 frames... +[2023-09-14 11:59:30,038][82512] Using port 40702 on host... +[2023-09-14 11:59:30,048][82513] Initialized w:7 v:2 player:1 +[2023-09-14 11:59:30,049][82513] Initialized w:7 v:2 player:3 +[2023-09-14 11:59:30,050][82513] Initialized w:7 v:2 player:2 +[2023-09-14 11:59:30,050][82513] Initialized w:7 v:2 player:7 +[2023-09-14 11:59:30,051][82513] Initialized w:7 v:2 player:0 +[2023-09-14 11:59:30,051][82512] Initializing env for player 1, init_info: {'port': 40702}... +[2023-09-14 11:59:30,051][82513] Initialized w:7 v:2 player:5 +[2023-09-14 11:59:30,054][82513] Initialized w:7 v:2 player:6 +[2023-09-14 11:59:30,054][82513] Initialized w:7 v:2 player:4 +[2023-09-14 11:59:30,055][82513] 8 agent workers initialized for env 7! +[2023-09-14 11:59:30,081][82479] Initializing env for player 2, init_info: {'port': 40602}... +[2023-09-14 11:59:30,087][82513] Decorrelating experience for 64 frames... +[2023-09-14 11:59:30,104][82512] Initializing env for player 2, init_info: {'port': 40702}... +[2023-09-14 11:59:30,140][82479] Initializing env for player 3, init_info: {'port': 40602}... +[2023-09-14 11:59:30,147][82476] Multi agent env, num agents: 8 +[2023-09-14 11:59:30,157][82512] Initializing env for player 3, init_info: {'port': 40702}... +[2023-09-14 11:59:30,185][82476] Multi agent env, num agents: 8 +[2023-09-14 11:59:30,191][82479] Initializing env for player 4, init_info: {'port': 40602}... +[2023-09-14 11:59:30,207][82512] Initializing env for player 4, init_info: {'port': 40702}... +[2023-09-14 11:59:30,232][82476] Port 40302 is available +[2023-09-14 11:59:30,232][82476] Using port 40302 +[2023-09-14 11:59:30,232][82476] Initializing env for player 0, init_info: {'port': 40302}... +[2023-09-14 11:59:30,243][82479] Initializing env for player 5, init_info: {'port': 40602}... +[2023-09-14 11:59:30,260][82512] Initializing env for player 5, init_info: {'port': 40702}... +[2023-09-14 11:59:30,277][82476] Using port 40302 on host... +[2023-09-14 11:59:30,288][82476] Initializing env for player 1, init_info: {'port': 40302}... +[2023-09-14 11:59:30,299][82479] Initializing env for player 6, init_info: {'port': 40602}... +[2023-09-14 11:59:30,319][82512] Initializing env for player 6, init_info: {'port': 40702}... +[2023-09-14 11:59:30,345][82476] Initializing env for player 2, init_info: {'port': 40302}... +[2023-09-14 11:59:30,363][82479] Initializing env for player 7, init_info: {'port': 40602}... +[2023-09-14 11:59:30,367][82512] Initializing env for player 7, init_info: {'port': 40702}... +[2023-09-14 11:59:30,395][82476] Initializing env for player 3, init_info: {'port': 40302}... +[2023-09-14 11:59:30,451][82476] Initializing env for player 4, init_info: {'port': 40302}... +[2023-09-14 11:59:30,523][82476] Initializing env for player 5, init_info: {'port': 40302}... +[2023-09-14 11:59:30,579][82476] Initializing env for player 6, init_info: {'port': 40302}... +[2023-09-14 11:59:30,663][82476] Initializing env for player 7, init_info: {'port': 40302}... +[2023-09-14 11:59:30,890][82478] Port 40503 is available +[2023-09-14 11:59:30,891][82478] Using port 40503 +[2023-09-14 11:59:30,891][82478] Initializing env for player 0, init_info: {'port': 40503}... +[2023-09-14 11:59:30,918][82513] Port 41003 is available +[2023-09-14 11:59:30,918][82513] Using port 41003 +[2023-09-14 11:59:30,918][82513] Initializing env for player 0, init_info: {'port': 41003}... +[2023-09-14 11:59:30,920][82478] Using port 40503 on host... +[2023-09-14 11:59:30,923][82514] Port 40903 is available +[2023-09-14 11:59:30,923][82514] Using port 40903 +[2023-09-14 11:59:30,924][82514] Initializing env for player 0, init_info: {'port': 40903}... +[2023-09-14 11:59:30,942][82478] Initializing env for player 1, init_info: {'port': 40503}... +[2023-09-14 11:59:30,948][82513] Using port 41003 on host... +[2023-09-14 11:59:30,966][82514] Using port 40903 on host... +[2023-09-14 11:59:30,969][82513] Initializing env for player 1, init_info: {'port': 41003}... +[2023-09-14 11:59:30,980][82514] Initializing env for player 1, init_info: {'port': 40903}... +[2023-09-14 11:59:30,999][82478] Initializing env for player 2, init_info: {'port': 40503}... +[2023-09-14 11:59:31,020][82513] Initializing env for player 2, init_info: {'port': 41003}... +[2023-09-14 11:59:31,038][82480] Port 40803 is available +[2023-09-14 11:59:31,038][82480] Using port 40803 +[2023-09-14 11:59:31,039][82480] Initializing env for player 0, init_info: {'port': 40803}... +[2023-09-14 11:59:31,041][82514] Initializing env for player 2, init_info: {'port': 40903}... +[2023-09-14 11:59:31,063][82478] Initializing env for player 3, init_info: {'port': 40503}... +[2023-09-14 11:59:31,068][82480] Using port 40803 on host... +[2023-09-14 11:59:31,071][82513] Initializing env for player 3, init_info: {'port': 41003}... +[2023-09-14 11:59:31,089][82480] Initializing env for player 1, init_info: {'port': 40803}... +[2023-09-14 11:59:31,103][82478] Initializing env for player 4, init_info: {'port': 40503}... +[2023-09-14 11:59:31,103][82514] Initializing env for player 3, init_info: {'port': 40903}... +[2023-09-14 11:59:31,139][82513] Initializing env for player 4, init_info: {'port': 41003}... +[2023-09-14 11:59:31,143][82480] Initializing env for player 2, init_info: {'port': 40803}... +[2023-09-14 11:59:31,154][82514] Initializing env for player 4, init_info: {'port': 40903}... +[2023-09-14 11:59:31,163][82478] Initializing env for player 5, init_info: {'port': 40503}... +[2023-09-14 11:59:31,170][82513] Initializing env for player 5, init_info: {'port': 41003}... +[2023-09-14 11:59:31,215][82480] Initializing env for player 3, init_info: {'port': 40803}... +[2023-09-14 11:59:31,217][82514] Initializing env for player 5, init_info: {'port': 40903}... +[2023-09-14 11:59:31,223][82478] Initializing env for player 6, init_info: {'port': 40503}... +[2023-09-14 11:59:31,239][82513] Initializing env for player 6, init_info: {'port': 41003}... +[2023-09-14 11:59:31,267][82480] Initializing env for player 4, init_info: {'port': 40803}... +[2023-09-14 11:59:31,271][82514] Initializing env for player 6, init_info: {'port': 40903}... +[2023-09-14 11:59:31,275][82478] Initializing env for player 7, init_info: {'port': 40503}... +[2023-09-14 11:59:31,319][82480] Initializing env for player 5, init_info: {'port': 40803}... +[2023-09-14 11:59:31,323][82514] Initializing env for player 7, init_info: {'port': 40903}... +[2023-09-14 11:59:31,323][82513] Initializing env for player 7, init_info: {'port': 41003}... +[2023-09-14 11:59:31,363][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:59:31,375][82480] Initializing env for player 6, init_info: {'port': 40803}... +[2023-09-14 11:59:31,471][82480] Initializing env for player 7, init_info: {'port': 40803}... +[2023-09-14 11:59:31,606][82479] Initialized w:3 v:2 player:1 +[2023-09-14 11:59:31,607][82479] Initialized w:3 v:2 player:0 +[2023-09-14 11:59:31,608][82479] Initialized w:3 v:2 player:5 +[2023-09-14 11:59:31,609][82479] Initialized w:3 v:2 player:4 +[2023-09-14 11:59:31,609][82479] Initialized w:3 v:2 player:7 +[2023-09-14 11:59:31,610][82479] Initialized w:3 v:2 player:6 +[2023-09-14 11:59:31,610][82479] Initialized w:3 v:2 player:3 +[2023-09-14 11:59:31,611][82479] Initialized w:3 v:2 player:2 +[2023-09-14 11:59:31,612][82479] 8 agent workers initialized for env 3! +[2023-09-14 11:59:31,661][82479] Decorrelating experience for 64 frames... +[2023-09-14 11:59:31,877][82512] Initialized w:4 v:2 player:0 +[2023-09-14 11:59:31,879][82512] Initialized w:4 v:2 player:3 +[2023-09-14 11:59:31,880][82512] Initialized w:4 v:2 player:5 +[2023-09-14 11:59:31,881][82512] Initialized w:4 v:2 player:1 +[2023-09-14 11:59:31,882][82512] Initialized w:4 v:2 player:4 +[2023-09-14 11:59:31,882][82512] Initialized w:4 v:2 player:2 +[2023-09-14 11:59:31,883][82512] Initialized w:4 v:2 player:7 +[2023-09-14 11:59:31,884][82512] Initialized w:4 v:2 player:6 +[2023-09-14 11:59:31,885][82512] 8 agent workers initialized for env 4! +[2023-09-14 11:59:31,944][82512] Decorrelating experience for 64 frames... +[2023-09-14 11:59:32,079][82476] Initialized w:0 v:2 player:4 +[2023-09-14 11:59:32,079][82476] Initialized w:0 v:2 player:5 +[2023-09-14 11:59:32,080][82476] Initialized w:0 v:2 player:2 +[2023-09-14 11:59:32,080][82476] Initialized w:0 v:2 player:1 +[2023-09-14 11:59:32,080][82476] Initialized w:0 v:2 player:6 +[2023-09-14 11:59:32,080][82476] Initialized w:0 v:2 player:3 +[2023-09-14 11:59:32,080][82476] Initialized w:0 v:2 player:7 +[2023-09-14 11:59:32,081][82476] Initialized w:0 v:2 player:0 +[2023-09-14 11:59:32,084][82476] 8 agent workers initialized for env 0! +[2023-09-14 11:59:32,134][82476] Decorrelating experience for 64 frames... +[2023-09-14 11:59:32,602][82512] Port 40703 is available +[2023-09-14 11:59:32,407][82479] Port 40603 is available +[2023-09-14 11:59:32,890][82512] Using port 40703 +[2023-09-14 11:59:32,890][82479] Using port 40603 +[2023-09-14 11:59:32,891][82479] Initializing env for player 0, init_info: {'port': 40603}... +[2023-09-14 11:59:32,924][82479] Using port 40603 on host... +[2023-09-14 11:59:32,942][82479] Initializing env for player 1, init_info: {'port': 40603}... +[2023-09-14 11:59:32,960][82476] Port 40303 is available +[2023-09-14 11:59:32,960][82476] Using port 40303 +[2023-09-14 11:59:32,961][82476] Initializing env for player 0, init_info: {'port': 40303}... +[2023-09-14 11:59:32,990][82476] Using port 40303 on host... +[2023-09-14 11:59:32,993][82479] Initializing env for player 2, init_info: {'port': 40603}... +[2023-09-14 11:59:33,012][82476] Initializing env for player 1, init_info: {'port': 40303}... +[2023-09-14 11:59:33,053][82479] Initializing env for player 3, init_info: {'port': 40603}... +[2023-09-14 11:59:33,062][82476] Initializing env for player 2, init_info: {'port': 40303}... +[2023-09-14 11:59:33,108][82479] Initializing env for player 4, init_info: {'port': 40603}... +[2023-09-14 11:59:33,119][82476] Initializing env for player 3, init_info: {'port': 40303}... +[2023-09-14 11:59:33,163][82479] Initializing env for player 5, init_info: {'port': 40603}... +[2023-09-14 11:59:33,168][82476] Initializing env for player 4, init_info: {'port': 40303}... +[2023-09-14 11:59:33,211][82479] Initializing env for player 6, init_info: {'port': 40603}... +[2023-09-14 11:59:33,223][82476] Initializing env for player 5, init_info: {'port': 40303}... +[2023-09-14 11:59:33,267][82479] Initializing env for player 7, init_info: {'port': 40603}... +[2023-09-14 11:59:33,291][82476] Initializing env for player 6, init_info: {'port': 40303}... +[2023-09-14 11:59:33,339][82513] Initialized w:7 v:3 player:4 +[2023-09-14 11:59:33,347][82476] Initializing env for player 7, init_info: {'port': 40303}... +[2023-09-14 11:59:33,341][82513] Initialized w:7 v:3 player:2 +[2023-09-14 11:59:33,341][82513] Initialized w:7 v:3 player:6 +[2023-09-14 11:59:33,342][82513] Initialized w:7 v:3 player:3 +[2023-09-14 11:59:33,342][82513] Initialized w:7 v:3 player:1 +[2023-09-14 11:59:33,343][82513] Initialized w:7 v:3 player:7 +[2023-09-14 11:59:33,347][82513] Initialized w:7 v:3 player:0 +[2023-09-14 11:59:34,425][82478] Initialized w:2 v:3 player:2 +[2023-09-14 11:59:34,427][82478] Initialized w:2 v:3 player:7 +[2023-09-14 11:59:34,428][82478] Initialized w:2 v:3 player:4 +[2023-09-14 11:59:34,428][82478] Initialized w:2 v:3 player:0 +[2023-09-14 11:59:34,430][82478] Initialized w:2 v:3 player:3 +[2023-09-14 11:59:34,430][82478] Initialized w:2 v:3 player:1 +[2023-09-14 11:59:34,431][82478] Initialized w:2 v:3 player:6 +[2023-09-14 11:59:34,509][82514] Initialized w:6 v:3 player:4 +[2023-09-14 11:59:34,510][82514] Initialized w:6 v:3 player:0 +[2023-09-14 11:59:34,511][82514] Initialized w:6 v:3 player:3 +[2023-09-14 11:59:34,511][82514] Initialized w:6 v:3 player:6 +[2023-09-14 11:59:34,512][82514] Initialized w:6 v:3 player:1 +[2023-09-14 11:59:34,512][82514] Initialized w:6 v:3 player:5 +[2023-09-14 11:59:34,512][82514] Initialized w:6 v:3 player:7 +[2023-09-14 11:59:34,512][82514] Initialized w:6 v:3 player:2 +[2023-09-14 11:59:34,514][82514] 8 agent workers initialized for env 6! +[2023-09-14 11:59:34,532][82480] Initialized w:5 v:3 player:1 +[2023-09-14 11:59:34,534][82480] Initialized w:5 v:3 player:3 +[2023-09-14 11:59:34,535][82480] Initialized w:5 v:3 player:7 +[2023-09-14 11:59:34,535][82480] Initialized w:5 v:3 player:4 +[2023-09-14 11:59:34,535][82480] Initialized w:5 v:3 player:0 +[2023-09-14 11:59:34,536][82480] Initialized w:5 v:3 player:2 +[2023-09-14 11:59:34,537][82480] Initialized w:5 v:3 player:6 +[2023-09-14 11:59:34,537][82480] Initialized w:5 v:3 player:5 +[2023-09-14 11:59:34,539][82480] 8 agent workers initialized for env 5! +[2023-09-14 11:59:34,553][82514] Decorrelating experience for 96 frames... +[2023-09-14 11:59:34,589][82480] Decorrelating experience for 96 frames... +[2023-09-14 11:59:35,175][82479] Initialized w:3 v:3 player:1 +[2023-09-14 11:59:35,176][82479] Initialized w:3 v:3 player:6 +[2023-09-14 11:59:35,176][82479] Initialized w:3 v:3 player:2 +[2023-09-14 11:59:35,177][82479] Initialized w:3 v:3 player:5 +[2023-09-14 11:59:35,177][82479] Initialized w:3 v:3 player:3 +[2023-09-14 11:59:35,177][82479] Initialized w:3 v:3 player:0 +[2023-09-14 11:59:35,178][82479] Initialized w:3 v:3 player:4 +[2023-09-14 11:59:35,179][82479] Initialized w:3 v:3 player:7 +[2023-09-14 11:59:35,180][82479] 8 agent workers initialized for env 3! +[2023-09-14 11:59:35,217][82479] Decorrelating experience for 96 frames... +[2023-09-14 11:59:35,425][82478] Initialized w:2 v:3 player:5 +[2023-09-14 11:59:35,425][82478] 8 agent workers initialized for env 2! +[2023-09-14 11:59:35,489][82478] Decorrelating experience for 96 frames... +[2023-09-14 11:59:35,682][82476] Initialized w:0 v:3 player:5 +[2023-09-14 11:59:35,683][82476] Initialized w:0 v:3 player:4 +[2023-09-14 11:59:35,683][82476] Initialized w:0 v:3 player:7 +[2023-09-14 11:59:35,682][82476] Initialized w:0 v:3 player:1 +[2023-09-14 11:59:35,682][82476] Initialized w:0 v:3 player:2 +[2023-09-14 11:59:35,685][82476] Initialized w:0 v:3 player:6 +[2023-09-14 11:59:35,685][82476] Initialized w:0 v:3 player:0 +[2023-09-14 11:59:35,686][82476] Initialized w:0 v:3 player:3 +[2023-09-14 11:59:35,688][82476] 8 agent workers initialized for env 0! +[2023-09-14 11:59:35,743][82476] Decorrelating experience for 96 frames... +[2023-09-14 11:59:36,363][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:59:38,126][82394] Signal inference workers to stop experience collection... +[2023-09-14 11:59:38,147][82475] InferenceWorker_p0-w0: stopping experience collection +[2023-09-14 11:59:38,693][97397] Heartbeat connected on Batcher_0 +[2023-09-14 11:59:38,700][97397] Heartbeat connected on InferenceWorker_p0-w0 +[2023-09-14 11:59:38,705][97397] Heartbeat connected on RolloutWorker_w0 +[2023-09-14 11:59:38,711][97397] Heartbeat connected on RolloutWorker_w2 +[2023-09-14 11:59:38,714][97397] Heartbeat connected on RolloutWorker_w3 +[2023-09-14 11:59:38,720][97397] Heartbeat connected on RolloutWorker_w5 +[2023-09-14 11:59:38,723][97397] Heartbeat connected on RolloutWorker_w6 +[2023-09-14 11:59:39,164][82394] EvtLoop [learner_proc0_evt_loop, process=learner_proc0] unhandled exception in slot='on_new_training_batch' connected to emitter=Emitter(object_id='Batcher_0', signal_name='training_batches_available'), args=(0,) +Traceback (most recent call last): + File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py", line 355, in _process_signal + slot_callable(*args) + File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner_worker.py", line 150, in on_new_training_batch + stats = self.learner.train(self.batcher.training_batches[batch_idx]) + File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 1046, in train + train_stats = self._train(buff, self.cfg.batch_size, experience_size, num_invalids) + File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 731, in _train + ) = self._calculate_losses(mb, num_invalids) + File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 649, in _calculate_losses + exploration_loss = self.exploration_loss_func(action_distribution, valids, num_invalids) + File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 477, in _symmetric_kl_exploration_loss + kl_prior = action_distribution.symmetric_kl_with_uniform_prior() + File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py", line 247, in symmetric_kl_with_uniform_prior + sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions] + File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py", line 247, in + sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions] +AttributeError: 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior' +[2023-09-14 11:59:39,165][82394] Unhandled exception 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior' in evt loop learner_proc0_evt_loop +[2023-09-14 11:59:41,363][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 242.9. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:59:42,913][82512] Port 40703 is available +[2023-09-14 11:59:42,914][82512] Using port 40703 +[2023-09-14 11:59:42,915][82512] Initializing env for player 0, init_info: {'port': 40703}... +[2023-09-14 11:59:42,949][82512] Using port 40703 on host... +[2023-09-14 11:59:42,965][82512] Initializing env for player 1, init_info: {'port': 40703}... +[2023-09-14 11:59:43,016][82512] Initializing env for player 2, init_info: {'port': 40703}... +[2023-09-14 11:59:43,066][82512] Initializing env for player 3, init_info: {'port': 40703}... +[2023-09-14 11:59:43,119][82512] Initializing env for player 4, init_info: {'port': 40703}... +[2023-09-14 11:59:43,171][82512] Initializing env for player 5, init_info: {'port': 40703}... +[2023-09-14 11:59:43,219][82512] Initializing env for player 6, init_info: {'port': 40703}... +[2023-09-14 11:59:43,275][82512] Initializing env for player 7, init_info: {'port': 40703}... +[2023-09-14 11:59:43,477][97397] Keyboard interrupt detected in the event loop EvtLoop [Runner_EvtLoop, process=main process 97397], exiting... +[2023-09-14 11:59:43,480][82394] Stopping Batcher_0... +[2023-09-14 11:59:43,481][82394] Loop batcher_evt_loop terminating... +[2023-09-14 11:59:43,480][97397] Runner profile tree view: +main_loop: 24.7527 +[2023-09-14 11:59:43,481][97397] Collected {0: 0}, FPS: 0.0 +[2023-09-14 11:59:43,497][82475] Weights refcount: 2 0 +[2023-09-14 11:59:43,498][82475] Stopping InferenceWorker_p0-w0... +[2023-09-14 11:59:43,498][82475] Loop inference_proc0-0_evt_loop terminating... +[2023-09-14 11:59:44,601][82512] Initialized w:4 v:3 player:7 +[2023-09-14 11:59:44,602][82512] Initialized w:4 v:3 player:2 +[2023-09-14 11:59:44,603][82512] Initialized w:4 v:3 player:5 +[2023-09-14 11:59:44,604][82512] Initialized w:4 v:3 player:1 +[2023-09-14 11:59:44,604][82512] Initialized w:4 v:3 player:0 +[2023-09-14 11:59:44,604][82512] Initialized w:4 v:3 player:3 +[2023-09-14 11:59:44,605][82512] Initialized w:4 v:3 player:4 +[2023-09-14 11:59:44,605][82512] Initialized w:4 v:3 player:6 +[2023-09-14 11:59:44,606][82512] 8 agent workers initialized for env 4! +[2023-09-14 11:59:44,651][82512] Decorrelating experience for 96 frames... +[2023-09-14 11:59:46,696][82478] Stopping RolloutWorker_w2... +[2023-09-14 11:59:46,696][82478] Loop rollout_proc2_evt_loop terminating... +[2023-09-14 11:59:46,697][82479] Stopping RolloutWorker_w3... +[2023-09-14 11:59:46,697][82479] Loop rollout_proc3_evt_loop terminating... +[2023-09-14 11:59:46,701][82476] Stopping RolloutWorker_w0... +[2023-09-14 11:59:46,702][82476] Loop rollout_proc0_evt_loop terminating... +[2023-09-14 11:59:46,703][82514] Stopping RolloutWorker_w6... +[2023-09-14 11:59:46,703][82514] Loop rollout_proc6_evt_loop terminating... +[2023-09-14 11:59:46,718][82480] Stopping RolloutWorker_w5... +[2023-09-14 11:59:46,718][82480] Loop rollout_proc5_evt_loop terminating... +[2023-09-14 11:59:48,297][97397] Environment doom_basic already registered, overwriting... +[2023-09-14 11:59:48,299][97397] Environment doom_two_colors_easy already registered, overwriting... +[2023-09-14 11:59:48,299][97397] Environment doom_two_colors_hard already registered, overwriting... +[2023-09-14 11:59:48,305][97397] Environment doom_dm already registered, overwriting... +[2023-09-14 11:59:48,305][97397] Environment doom_dwango5 already registered, overwriting... +[2023-09-14 11:59:48,306][97397] Environment doom_my_way_home_flat_actions already registered, overwriting... +[2023-09-14 11:59:48,307][97397] Environment doom_defend_the_center_flat_actions already registered, overwriting... +[2023-09-14 11:59:48,308][97397] Environment doom_my_way_home already registered, overwriting... +[2023-09-14 11:59:48,309][97397] Environment doom_deadly_corridor already registered, overwriting... +[2023-09-14 11:59:48,309][97397] Environment doom_defend_the_center already registered, overwriting... +[2023-09-14 11:59:48,310][97397] Environment doom_defend_the_line already registered, overwriting... +[2023-09-14 11:59:48,310][97397] Environment doom_health_gathering already registered, overwriting... +[2023-09-14 11:59:48,311][97397] Environment doom_health_gathering_supreme already registered, overwriting... +[2023-09-14 11:59:48,312][97397] Environment doom_battle already registered, overwriting... +[2023-09-14 11:59:48,312][97397] Environment doom_battle2 already registered, overwriting... +[2023-09-14 11:59:48,313][97397] Environment doom_duel_bots already registered, overwriting... +[2023-09-14 11:59:48,313][97397] Environment doom_deathmatch_bots already registered, overwriting... +[2023-09-14 11:59:48,314][97397] Environment doom_duel already registered, overwriting... +[2023-09-14 11:59:48,314][97397] Environment doom_deathmatch_full already registered, overwriting... +[2023-09-14 11:59:48,315][97397] Environment doom_benchmark already registered, overwriting... +[2023-09-14 11:59:48,315][97397] register_encoder_factory: +[2023-09-14 11:59:48,349][97397] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json +[2023-09-14 11:59:48,350][97397] Overriding arg 'env' with value 'doom_duel' passed from command line +[2023-09-14 11:59:48,355][97397] Experiment dir /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment already exists! +[2023-09-14 11:59:48,356][97397] Resuming existing experiment from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment... +[2023-09-14 11:59:48,357][97397] Weights and Biases integration disabled +[2023-09-14 11:59:48,359][97397] Environment var CUDA_VISIBLE_DEVICES is 0,1 + +[2023-09-14 11:59:48,712][82512] Stopping RolloutWorker_w4... +[2023-09-14 11:59:48,713][82512] Loop rollout_proc4_evt_loop terminating... +[2023-09-14 11:59:50,315][97397] Starting experiment with the following configuration: +help=False +algo=APPO +env=doom_duel +experiment=default_experiment +train_dir=/home/cogstack/Documents/optuna/environments/sample_factory/train_dir +restart_behavior=resume +device=gpu +seed=None +num_policies=1 +async_rl=True +serial_mode=False +batched_sampling=False +num_batches_to_accumulate=2 +worker_num_splits=2 +policy_workers_per_policy=1 +max_policy_lag=1000 +num_workers=8 +num_envs_per_worker=4 +batch_size=1024 +num_batches_per_epoch=1 +num_epochs=1 +rollout=32 +recurrence=32 +shuffle_minibatches=False +gamma=0.99 +reward_scale=1.0 +reward_clip=1000.0 +value_bootstrap=False +normalize_returns=True +exploration_loss_coeff=0.001 +value_loss_coeff=0.5 +kl_loss_coeff=0.0 +exploration_loss=symmetric_kl +gae_lambda=0.95 +ppo_clip_ratio=0.1 +ppo_clip_value=0.2 +with_vtrace=False +vtrace_rho=1.0 +vtrace_c=1.0 +optimizer=adam +adam_eps=1e-06 +adam_beta1=0.9 +adam_beta2=0.999 +max_grad_norm=4.0 +learning_rate=0.0001 +lr_schedule=constant +lr_schedule_kl_threshold=0.008 +lr_adaptive_min=1e-06 +lr_adaptive_max=0.01 +obs_subtract_mean=0.0 +obs_scale=255.0 +normalize_input=True +normalize_input_keys=None +decorrelate_experience_max_seconds=0 +decorrelate_envs_on_one_worker=True +actor_worker_gpus=[] +set_workers_cpu_affinity=True +force_envs_single_thread=False +default_niceness=0 +log_to_file=True +experiment_summaries_interval=10 +flush_summaries_interval=30 +stats_avg=100 +summaries_use_frameskip=True +heartbeat_interval=20 +heartbeat_reporting_interval=600 +train_for_env_steps=1000000 +train_for_seconds=10000000000 +save_every_sec=120 +keep_checkpoints=2 +load_checkpoint_kind=latest +save_milestones_sec=-1 +save_best_every_sec=5 +save_best_metric=reward +save_best_after=100000 +benchmark=False +encoder_mlp_layers=[512, 512] +encoder_conv_architecture=convnet_simple +encoder_conv_mlp_layers=[512] +use_rnn=True +rnn_size=512 +rnn_type=gru +rnn_num_layers=1 +decoder_mlp_layers=[] +nonlinearity=elu +policy_initialization=orthogonal +policy_init_gain=1.0 +actor_critic_share_weights=True +adaptive_stddev=True +continuous_tanh_scale=0.0 +initial_stddev=1.0 +use_env_info_cache=False +env_gpu_actions=False +env_gpu_observations=True +env_frameskip=4 +env_framestack=1 +pixel_format=CHW +use_record_episode_statistics=False +with_wandb=False +wandb_user=None +wandb_project=sample_factory +wandb_group=None +wandb_job_type=SF +wandb_tags=[] +with_pbt=False +pbt_mix_policies_in_one_env=True +pbt_period_env_steps=5000000 +pbt_start_mutation=20000000 +pbt_replace_fraction=0.3 +pbt_mutation_rate=0.15 +pbt_replace_reward_gap=0.1 +pbt_replace_reward_gap_absolute=1e-06 +pbt_optimize_gamma=False +pbt_target_objective=true_objective +pbt_perturb_min=1.1 +pbt_perturb_max=1.5 +num_agents=-1 +num_humans=0 +num_bots=-1 +start_bot_difficulty=None +timelimit=None +res_w=128 +res_h=72 +wide_aspect_ratio=False +eval_env_frameskip=1 +fps=35 +command_line=--env=doom_dm --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=20000000 +cli_args={'env': 'doom_dm', 'num_workers': 8, 'num_envs_per_worker': 4, 'train_for_env_steps': 20000000} +git_hash=20b6d44612dad7d171f23e13b1f3b4c5e5631cf9 +git_repo_name=https://github.com/MattStammers/optuna.git +[2023-09-14 11:59:50,316][97397] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json... +[2023-09-14 11:59:50,435][97397] Rollout worker 0 uses device cpu +[2023-09-14 11:59:50,436][97397] Rollout worker 1 uses device cpu +[2023-09-14 11:59:50,438][97397] Rollout worker 2 uses device cpu +[2023-09-14 11:59:50,439][97397] Rollout worker 3 uses device cpu +[2023-09-14 11:59:50,439][97397] Rollout worker 4 uses device cpu +[2023-09-14 11:59:50,440][97397] Rollout worker 5 uses device cpu +[2023-09-14 11:59:50,441][97397] Rollout worker 6 uses device cpu +[2023-09-14 11:59:50,442][97397] Rollout worker 7 uses device cpu +[2023-09-14 11:59:50,510][97397] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 11:59:50,511][97397] InferenceWorker_p0-w0: min num requests: 2 +[2023-09-14 11:59:50,548][97397] Starting all processes... +[2023-09-14 11:59:50,549][97397] Starting process learner_proc0 +[2023-09-14 11:59:52,142][97397] Starting all processes... +[2023-09-14 11:59:52,144][86679] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 11:59:52,144][86679] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 +[2023-09-14 11:59:52,147][97397] Starting process inference_proc0-0 +[2023-09-14 11:59:52,147][97397] Starting process rollout_proc0 +[2023-09-14 11:59:52,162][86679] Num visible devices: 1 +[2023-09-14 11:59:52,184][86679] Starting seed is not provided +[2023-09-14 11:59:52,184][86679] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 11:59:52,184][86679] Initializing actor-critic model on device cuda:0 +[2023-09-14 11:59:52,185][86679] RunningMeanStd input shape: (23,) +[2023-09-14 11:59:52,185][86679] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 11:59:52,186][86679] RunningMeanStd input shape: (1,) +[2023-09-14 11:59:52,198][86679] ConvEncoder: input_channels=3 +[2023-09-14 11:59:52,148][97397] Starting process rollout_proc1 +[2023-09-14 11:59:52,149][97397] Starting process rollout_proc2 +[2023-09-14 11:59:52,149][97397] Starting process rollout_proc3 +[2023-09-14 11:59:52,150][97397] Starting process rollout_proc4 +[2023-09-14 11:59:52,150][97397] Starting process rollout_proc5 +[2023-09-14 11:59:52,151][97397] Starting process rollout_proc6 +[2023-09-14 11:59:52,151][97397] Starting process rollout_proc7 +[2023-09-14 11:59:52,413][86679] Conv encoder output size: 512 +[2023-09-14 11:59:52,414][86679] Policy head output size: 640 +[2023-09-14 11:59:52,432][86679] Created Actor Critic model with architecture: +[2023-09-14 11:59:52,432][86679] ActorCriticSharedWeights( + (obs_normalizer): ObservationNormalizer( + (running_mean_std): RunningMeanStdDictInPlace( + (running_mean_std): ModuleDict( + (measurements): RunningMeanStdInPlace() + (obs): RunningMeanStdInPlace() + ) + ) + ) + (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) + (encoder): VizdoomEncoder( + (basic_encoder): ConvEncoder( + (enc): RecursiveScriptModule( + original_name=ConvEncoderImpl + (conv_head): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Conv2d) + (1): RecursiveScriptModule(original_name=ELU) + (2): RecursiveScriptModule(original_name=Conv2d) + (3): RecursiveScriptModule(original_name=ELU) + (4): RecursiveScriptModule(original_name=Conv2d) + (5): RecursiveScriptModule(original_name=ELU) + ) + (mlp_layers): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Linear) + (1): RecursiveScriptModule(original_name=ELU) + ) + ) + ) + (measurements_head): Sequential( + (0): Linear(in_features=23, out_features=128, bias=True) + (1): ELU(alpha=1.0) + (2): Linear(in_features=128, out_features=128, bias=True) + (3): ELU(alpha=1.0) + ) + ) + (core): ModelCoreRNN( + (core): GRU(640, 512) + ) + (decoder): MlpDecoder( + (mlp): Identity() + ) + (critic_linear): Linear(in_features=512, out_features=1, bias=True) + (action_parameterization): ActionParameterizationDefault( + (distribution_linear): Linear(in_features=512, out_features=41, bias=True) + ) +) +[2023-09-14 11:59:53,546][86679] Using optimizer +[2023-09-14 11:59:53,547][86679] No checkpoints found +[2023-09-14 11:59:53,547][86679] Did not load from checkpoint, starting from scratch! +[2023-09-14 11:59:53,547][86679] Initialized policy 0 weights for model version 0 +[2023-09-14 11:59:53,549][86679] LearnerWorker_p0 finished initialization! +[2023-09-14 11:59:53,549][86679] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 11:59:54,121][86884] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 11:59:54,121][86884] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 +[2023-09-14 11:59:54,139][86884] Num visible devices: 1 +[2023-09-14 11:59:54,166][86886] Worker 2 uses CPU cores [8, 9, 10, 11] +[2023-09-14 11:59:54,286][86887] Worker 3 uses CPU cores [12, 13, 14, 15] +[2023-09-14 11:59:54,324][86892] Worker 6 uses CPU cores [24, 25, 26, 27] +[2023-09-14 11:59:54,403][86890] Worker 5 uses CPU cores [20, 21, 22, 23] +[2023-09-14 11:59:54,483][86885] Worker 0 uses CPU cores [0, 1, 2, 3] +[2023-09-14 11:59:54,535][86889] Worker 4 uses CPU cores [16, 17, 18, 19] +[2023-09-14 11:59:54,556][86888] Worker 1 uses CPU cores [4, 5, 6, 7] +[2023-09-14 11:59:54,569][97397] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 0. Throughput: 0: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:59:54,570][86891] Worker 7 uses CPU cores [28, 29, 30, 31] +[2023-09-14 11:59:54,852][86884] RunningMeanStd input shape: (23,) +[2023-09-14 11:59:54,853][86884] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 11:59:54,853][86884] RunningMeanStd input shape: (1,) +[2023-09-14 11:59:54,865][86884] ConvEncoder: input_channels=3 +[2023-09-14 11:59:54,968][86884] Conv encoder output size: 512 +[2023-09-14 11:59:54,969][86884] Policy head output size: 640 +[2023-09-14 11:59:55,246][97397] Inference worker 0-0 is ready! +[2023-09-14 11:59:55,248][97397] All inference workers are ready! Signal rollout workers to start! +[2023-09-14 11:59:55,254][86890] Multi agent env, num agents: 2 +[2023-09-14 11:59:55,254][86892] Multi agent env, num agents: 2 +[2023-09-14 11:59:55,254][86886] Multi agent env, num agents: 2 +[2023-09-14 11:59:55,254][86888] Multi agent env, num agents: 2 +[2023-09-14 11:59:55,255][86889] Multi agent env, num agents: 2 +[2023-09-14 11:59:55,255][86885] Multi agent env, num agents: 2 +[2023-09-14 11:59:55,255][86891] Multi agent env, num agents: 2 +[2023-09-14 11:59:55,255][86887] Multi agent env, num agents: 2 +[2023-09-14 11:59:55,287][86890] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:59:55,287][86889] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:59:55,287][86892] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:59:55,288][86886] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:59:55,289][86888] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:59:55,290][86890] Multi agent env, num agents: 2 +[2023-09-14 11:59:55,290][86892] Multi agent env, num agents: 2 +[2023-09-14 11:59:55,290][86889] Multi agent env, num agents: 2 +[2023-09-14 11:59:55,291][86886] Multi agent env, num agents: 2 +[2023-09-14 11:59:55,292][86885] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:59:55,292][86888] Multi agent env, num agents: 2 +[2023-09-14 11:59:55,295][86885] Multi agent env, num agents: 2 +[2023-09-14 11:59:55,307][86891] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:59:55,307][86887] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 11:59:55,311][86891] Multi agent env, num agents: 2 +[2023-09-14 11:59:55,311][86887] Multi agent env, num agents: 2 +[2023-09-14 11:59:55,320][86892] Port 40900 is available +[2023-09-14 11:59:55,320][86890] Port 40800 is available +[2023-09-14 11:59:55,320][86892] Using port 40900 +[2023-09-14 11:59:55,320][86890] Using port 40800 +[2023-09-14 11:59:55,321][86886] Port 40500 is available +[2023-09-14 11:59:55,321][86886] Using port 40500 +[2023-09-14 11:59:55,321][86889] Port 40700 is available +[2023-09-14 11:59:55,321][86889] Using port 40700 +[2023-09-14 11:59:55,321][86892] Initializing env for player 0, init_info: {'port': 40900}... +[2023-09-14 11:59:55,321][86890] Initializing env for player 0, init_info: {'port': 40800}... +[2023-09-14 11:59:55,322][86888] Port 40400 is available +[2023-09-14 11:59:55,322][86888] Using port 40400 +[2023-09-14 11:59:55,322][86889] Initializing env for player 0, init_info: {'port': 40700}... +[2023-09-14 11:59:55,323][86888] Initializing env for player 0, init_info: {'port': 40400}... +[2023-09-14 11:59:55,325][86885] Port 40300 is available +[2023-09-14 11:59:55,325][86885] Using port 40300 +[2023-09-14 11:59:55,326][86885] Initializing env for player 0, init_info: {'port': 40300}... +[2023-09-14 11:59:55,354][86885] Using port 40300 on host... +[2023-09-14 11:59:55,356][86892] Using port 40900 on host... +[2023-09-14 11:59:55,357][86889] Using port 40700 on host... +[2023-09-14 11:59:55,359][86887] Port 40600 is available +[2023-09-14 11:59:55,359][86887] Using port 40600 +[2023-09-14 11:59:55,360][86891] UDP port 41000 cannot be used [Errno 98] Address already in use +[2023-09-14 11:59:55,360][86891] Port 42000 is available +[2023-09-14 11:59:55,360][86887] Initializing env for player 0, init_info: {'port': 40600}... +[2023-09-14 11:59:55,361][86891] Using port 42000 +[2023-09-14 11:59:55,361][86891] Initializing env for player 0, init_info: {'port': 42000}... +[2023-09-14 11:59:55,369][86890] Using port 40800 on host... +[2023-09-14 11:59:55,371][86888] Using port 40400 on host... +[2023-09-14 11:59:55,372][86889] Initializing env for player 1, init_info: {'port': 40700}... +[2023-09-14 11:59:55,375][86892] Initializing env for player 1, init_info: {'port': 40900}... +[2023-09-14 11:59:55,376][86885] Initializing env for player 1, init_info: {'port': 40300}... +[2023-09-14 11:59:55,383][86888] Initializing env for player 1, init_info: {'port': 40400}... +[2023-09-14 11:59:55,408][86887] Using port 40600 on host... +[2023-09-14 11:59:55,409][86891] Using port 42000 on host... +[2023-09-14 11:59:55,411][86887] Initializing env for player 1, init_info: {'port': 40600}... +[2023-09-14 11:59:55,411][86891] Initializing env for player 1, init_info: {'port': 42000}... +[2023-09-14 11:59:55,388][86890] Initializing env for player 1, init_info: {'port': 40800}... +[2023-09-14 11:59:56,430][86892] Initialized w:6 v:0 player:0 +[2023-09-14 11:59:56,431][86892] Initialized w:6 v:0 player:1 +[2023-09-14 11:59:56,433][86892] 2 agent workers initialized for env 6! +[2023-09-14 11:59:56,447][86892] Decorrelating experience for 0 frames... +[2023-09-14 11:59:56,447][86892] Port 40901 is available +[2023-09-14 11:59:56,448][86892] Using port 40901 +[2023-09-14 11:59:56,448][86892] Initializing env for player 0, init_info: {'port': 40901}... +[2023-09-14 11:59:56,483][86892] Using port 40901 on host... +[2023-09-14 11:59:56,499][86892] Initializing env for player 1, init_info: {'port': 40901}... +[2023-09-14 11:59:56,560][86888] Initialized w:1 v:0 player:0 +[2023-09-14 11:59:56,560][86888] Initialized w:1 v:0 player:1 +[2023-09-14 11:59:56,562][86888] 2 agent workers initialized for env 1! +[2023-09-14 11:59:56,562][86889] Initialized w:4 v:0 player:1 +[2023-09-14 11:59:56,563][86889] Initialized w:4 v:0 player:0 +[2023-09-14 11:59:56,565][86889] 2 agent workers initialized for env 4! +[2023-09-14 11:59:56,574][86888] Decorrelating experience for 0 frames... +[2023-09-14 11:59:56,575][86889] Decorrelating experience for 0 frames... +[2023-09-14 11:59:56,576][86888] Port 40401 is available +[2023-09-14 11:59:56,576][86888] Using port 40401 +[2023-09-14 11:59:56,576][86889] Port 40701 is available +[2023-09-14 11:59:56,576][86889] Using port 40701 +[2023-09-14 11:59:56,577][86889] Initializing env for player 0, init_info: {'port': 40701}... +[2023-09-14 11:59:56,579][86885] Initialized w:0 v:0 player:0 +[2023-09-14 11:59:56,580][86885] Initialized w:0 v:0 player:1 +[2023-09-14 11:59:56,580][86891] Initialized w:7 v:0 player:0 +[2023-09-14 11:59:56,581][86885] 2 agent workers initialized for env 0! +[2023-09-14 11:59:56,581][86891] Initialized w:7 v:0 player:1 +[2023-09-14 11:59:56,583][86891] 2 agent workers initialized for env 7! +[2023-09-14 11:59:56,583][86887] Initialized w:3 v:0 player:1 +[2023-09-14 11:59:56,583][86887] Initialized w:3 v:0 player:0 +[2023-09-14 11:59:56,585][86887] 2 agent workers initialized for env 3! +[2023-09-14 11:59:56,591][86885] Decorrelating experience for 0 frames... +[2023-09-14 11:59:56,592][86885] Port 40301 is available +[2023-09-14 11:59:56,592][86885] Using port 40301 +[2023-09-14 11:59:56,592][86885] Initializing env for player 0, init_info: {'port': 40301}... +[2023-09-14 11:59:56,595][86891] Decorrelating experience for 0 frames... +[2023-09-14 11:59:56,595][86887] Decorrelating experience for 0 frames... +[2023-09-14 11:59:56,596][86891] UDP port 41001 cannot be used [Errno 98] Address already in use +[2023-09-14 11:59:56,596][86887] Port 40601 is available +[2023-09-14 11:59:56,596][86887] Using port 40601 +[2023-09-14 11:59:56,596][86891] Port 42001 is available +[2023-09-14 11:59:56,596][86891] Using port 42001 +[2023-09-14 11:59:56,597][86887] Initializing env for player 0, init_info: {'port': 40601}... +[2023-09-14 11:59:56,599][86890] Initialized w:5 v:0 player:0 +[2023-09-14 11:59:56,601][86890] Initialized w:5 v:0 player:1 +[2023-09-14 11:59:56,601][86890] 2 agent workers initialized for env 5! +[2023-09-14 11:59:56,609][86889] Using port 40701 on host... +[2023-09-14 11:59:56,612][86890] Decorrelating experience for 0 frames... +[2023-09-14 11:59:56,613][86890] Port 40801 is available +[2023-09-14 11:59:56,613][86890] Using port 40801 +[2023-09-14 11:59:56,613][86890] Initializing env for player 0, init_info: {'port': 40801}... +[2023-09-14 11:59:56,623][86885] Using port 40301 on host... +[2023-09-14 11:59:56,625][86887] Using port 40601 on host... +[2023-09-14 11:59:56,627][86889] Initializing env for player 1, init_info: {'port': 40701}... +[2023-09-14 11:59:56,643][86890] Using port 40801 on host... +[2023-09-14 11:59:56,643][86885] Initializing env for player 1, init_info: {'port': 40301}... +[2023-09-14 11:59:56,647][86887] Initializing env for player 1, init_info: {'port': 40601}... +[2023-09-14 11:59:56,664][86890] Initializing env for player 1, init_info: {'port': 40801}... +[2023-09-14 11:59:57,531][86892] Initialized w:6 v:1 player:1 +[2023-09-14 11:59:57,532][86892] Initialized w:6 v:1 player:0 +[2023-09-14 11:59:57,534][86892] 2 agent workers initialized for env 6! +[2023-09-14 11:59:57,534][86888] Initializing env for player 0, init_info: {'port': 40401}... +[2023-09-14 11:59:57,543][86892] Decorrelating experience for 32 frames... +[2023-09-14 11:59:57,579][86888] Using port 40401 on host... +[2023-09-14 11:59:57,588][86888] Initializing env for player 1, init_info: {'port': 40401}... +[2023-09-14 11:59:57,611][86892] Multi agent env, num agents: 2 +[2023-09-14 11:59:57,641][86892] Multi agent env, num agents: 2 +[2023-09-14 11:59:57,670][86892] Port 40902 is available +[2023-09-14 11:59:57,670][86892] Using port 40902 +[2023-09-14 11:59:57,670][86892] Initializing env for player 0, init_info: {'port': 40902}... +[2023-09-14 11:59:57,705][86892] Using port 40902 on host... +[2023-09-14 11:59:57,721][86892] Initializing env for player 1, init_info: {'port': 40902}... +[2023-09-14 11:59:57,743][86890] Initialized w:5 v:1 player:0 +[2023-09-14 11:59:57,743][86890] Initialized w:5 v:1 player:1 +[2023-09-14 11:59:57,745][86890] 2 agent workers initialized for env 5! +[2023-09-14 11:59:57,745][86887] Initialized w:3 v:1 player:1 +[2023-09-14 11:59:57,746][86887] Initialized w:3 v:1 player:0 +[2023-09-14 11:59:57,748][86887] 2 agent workers initialized for env 3! +[2023-09-14 11:59:57,753][86886] Initializing env for player 0, init_info: {'port': 40500}... +[2023-09-14 11:59:57,758][86887] Decorrelating experience for 32 frames... +[2023-09-14 11:59:57,760][86890] Decorrelating experience for 32 frames... +[2023-09-14 11:59:57,790][86889] Initialized w:4 v:1 player:0 +[2023-09-14 11:59:57,790][86889] Initialized w:4 v:1 player:1 +[2023-09-14 11:59:57,792][86889] 2 agent workers initialized for env 4! +[2023-09-14 11:59:57,798][86886] Using port 40500 on host... +[2023-09-14 11:59:57,803][86885] Initialized w:0 v:1 player:1 +[2023-09-14 11:59:57,803][86889] Decorrelating experience for 32 frames... +[2023-09-14 11:59:57,804][86885] Initialized w:0 v:1 player:0 +[2023-09-14 11:59:57,805][86885] 2 agent workers initialized for env 0! +[2023-09-14 11:59:57,807][86886] Initializing env for player 1, init_info: {'port': 40500}... +[2023-09-14 11:59:57,811][86891] Initializing env for player 0, init_info: {'port': 42001}... +[2023-09-14 11:59:57,814][86885] Decorrelating experience for 32 frames... +[2023-09-14 11:59:57,843][86887] Multi agent env, num agents: 2 +[2023-09-14 11:59:57,847][86891] Using port 42001 on host... +[2023-09-14 11:59:57,848][86890] Multi agent env, num agents: 2 +[2023-09-14 11:59:57,861][86891] Initializing env for player 1, init_info: {'port': 42001}... +[2023-09-14 11:59:57,880][86889] Multi agent env, num agents: 2 +[2023-09-14 11:59:57,881][86887] Multi agent env, num agents: 2 +[2023-09-14 11:59:57,890][86885] Multi agent env, num agents: 2 +[2023-09-14 11:59:57,894][86890] Multi agent env, num agents: 2 +[2023-09-14 11:59:57,911][86889] Multi agent env, num agents: 2 +[2023-09-14 11:59:57,921][86885] Multi agent env, num agents: 2 +[2023-09-14 11:59:57,924][86887] Port 40602 is available +[2023-09-14 11:59:57,925][86887] Using port 40602 +[2023-09-14 11:59:57,925][86887] Initializing env for player 0, init_info: {'port': 40602}... +[2023-09-14 11:59:57,939][86890] Port 40802 is available +[2023-09-14 11:59:57,939][86890] Using port 40802 +[2023-09-14 11:59:57,942][86889] Port 40702 is available +[2023-09-14 11:59:57,942][86889] Using port 40702 +[2023-09-14 11:59:57,944][86889] Initializing env for player 0, init_info: {'port': 40702}... +[2023-09-14 11:59:57,952][86885] Port 40302 is available +[2023-09-14 11:59:57,953][86885] Using port 40302 +[2023-09-14 11:59:57,954][86885] Initializing env for player 0, init_info: {'port': 40302}... +[2023-09-14 11:59:57,958][86887] Using port 40602 on host... +[2023-09-14 11:59:57,973][86889] Using port 40702 on host... +[2023-09-14 11:59:57,976][86887] Initializing env for player 1, init_info: {'port': 40602}... +[2023-09-14 11:59:57,984][86885] Using port 40302 on host... +[2023-09-14 11:59:57,994][86889] Initializing env for player 1, init_info: {'port': 40702}... +[2023-09-14 11:59:58,003][86885] Initializing env for player 1, init_info: {'port': 40302}... +[2023-09-14 11:59:58,359][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 11:59:58,700][86888] Initialized w:1 v:1 player:1 +[2023-09-14 11:59:58,701][86888] Initialized w:1 v:1 player:0 +[2023-09-14 11:59:58,702][86888] 2 agent workers initialized for env 1! +[2023-09-14 11:59:58,709][86888] Decorrelating experience for 32 frames... +[2023-09-14 11:59:58,774][86888] Multi agent env, num agents: 2 +[2023-09-14 11:59:58,805][86888] Multi agent env, num agents: 2 +[2023-09-14 11:59:58,836][86888] Port 40402 is available +[2023-09-14 11:59:58,836][86888] Using port 40402 +[2023-09-14 11:59:58,837][86888] Initializing env for player 0, init_info: {'port': 40402}... +[2023-09-14 11:59:58,845][86892] Initialized w:6 v:2 player:1 +[2023-09-14 11:59:58,853][86886] Initialized w:2 v:0 player:1 +[2023-09-14 11:59:58,854][86886] Initialized w:2 v:0 player:0 +[2023-09-14 11:59:58,856][86886] 2 agent workers initialized for env 2! +[2023-09-14 11:59:58,869][86886] Decorrelating experience for 0 frames... +[2023-09-14 11:59:58,870][86886] Port 40501 is available +[2023-09-14 11:59:58,870][86886] Using port 40501 +[2023-09-14 11:59:58,871][86888] Using port 40402 on host... +[2023-09-14 11:59:58,887][86888] Initializing env for player 1, init_info: {'port': 40402}... +[2023-09-14 11:59:59,057][86891] Initialized w:7 v:1 player:1 +[2023-09-14 11:59:59,058][86891] Initialized w:7 v:1 player:0 +[2023-09-14 11:59:59,060][86891] 2 agent workers initialized for env 7! +[2023-09-14 11:59:59,075][86891] Decorrelating experience for 32 frames... +[2023-09-14 11:59:59,081][86887] Initialized w:3 v:2 player:0 +[2023-09-14 11:59:59,081][86887] Initialized w:3 v:2 player:1 +[2023-09-14 11:59:59,082][86887] 2 agent workers initialized for env 3! +[2023-09-14 11:59:59,092][86887] Decorrelating experience for 64 frames... +[2023-09-14 11:59:59,100][86890] Initializing env for player 0, init_info: {'port': 40802}... +[2023-09-14 11:59:59,125][86885] Initialized w:0 v:2 player:0 +[2023-09-14 11:59:59,126][86885] Initialized w:0 v:2 player:1 +[2023-09-14 11:59:59,127][86885] 2 agent workers initialized for env 0! +[2023-09-14 11:59:59,137][86885] Decorrelating experience for 64 frames... +[2023-09-14 11:59:59,145][86890] Using port 40802 on host... +[2023-09-14 11:59:59,150][86890] Initializing env for player 1, init_info: {'port': 40802}... +[2023-09-14 11:59:59,152][86891] Multi agent env, num agents: 2 +[2023-09-14 11:59:59,176][86889] Initialized w:4 v:2 player:1 +[2023-09-14 11:59:59,176][86889] Initialized w:4 v:2 player:0 +[2023-09-14 11:59:59,178][86889] 2 agent workers initialized for env 4! +[2023-09-14 11:59:59,184][86891] Multi agent env, num agents: 2 +[2023-09-14 11:59:59,186][86889] Decorrelating experience for 64 frames... +[2023-09-14 11:59:59,223][86891] UDP port 41002 cannot be used [Errno 98] Address already in use +[2023-09-14 11:59:59,223][86891] Port 42002 is available +[2023-09-14 11:59:59,224][86891] Using port 42002 +[2023-09-14 11:59:59,224][86891] Initializing env for player 0, init_info: {'port': 42002}... +[2023-09-14 11:59:59,260][86891] Using port 42002 on host... +[2023-09-14 11:59:59,275][86891] Initializing env for player 1, init_info: {'port': 42002}... +[2023-09-14 11:59:59,308][86885] Port 40303 is available +[2023-09-14 11:59:59,308][86887] Port 40603 is available +[2023-09-14 11:59:59,308][86885] Using port 40303 +[2023-09-14 11:59:59,308][86887] Using port 40603 +[2023-09-14 11:59:59,309][86885] Initializing env for player 0, init_info: {'port': 40303}... +[2023-09-14 11:59:59,309][86887] Initializing env for player 0, init_info: {'port': 40603}... +[2023-09-14 11:59:59,344][86885] Using port 40303 on host... +[2023-09-14 11:59:59,345][86889] Port 40703 is available +[2023-09-14 11:59:59,345][86889] Using port 40703 +[2023-09-14 11:59:59,345][86889] Initializing env for player 0, init_info: {'port': 40703}... +[2023-09-14 11:59:59,355][86887] Using port 40603 on host... +[2023-09-14 11:59:59,359][86885] Initializing env for player 1, init_info: {'port': 40303}... +[2023-09-14 11:59:59,359][86887] Initializing env for player 1, init_info: {'port': 40603}... +[2023-09-14 11:59:59,376][86889] Using port 40703 on host... +[2023-09-14 11:59:59,396][86889] Initializing env for player 1, init_info: {'port': 40703}... +[2023-09-14 11:59:59,845][86892] Initialized w:6 v:2 player:0 +[2023-09-14 11:59:59,847][86892] 2 agent workers initialized for env 6! +[2023-09-14 11:59:59,863][86892] Decorrelating experience for 64 frames... +[2023-09-14 11:59:59,879][86886] Initializing env for player 0, init_info: {'port': 40501}... +[2023-09-14 11:59:59,911][86886] Using port 40501 on host... +[2023-09-14 11:59:59,930][86886] Initializing env for player 1, init_info: {'port': 40501}... +[2023-09-14 11:59:59,959][86888] Initialized w:1 v:2 player:1 +[2023-09-14 11:59:59,960][86888] Initialized w:1 v:2 player:0 +[2023-09-14 11:59:59,961][86888] 2 agent workers initialized for env 1! +[2023-09-14 11:59:59,970][86888] Decorrelating experience for 64 frames... +[2023-09-14 12:00:00,069][86892] Port 40903 is available +[2023-09-14 12:00:00,069][86892] Using port 40903 +[2023-09-14 12:00:00,128][86888] Port 40403 is available +[2023-09-14 12:00:00,129][86888] Using port 40403 +[2023-09-14 12:00:00,129][86888] Initializing env for player 0, init_info: {'port': 40403}... +[2023-09-14 12:00:00,159][86888] Using port 40403 on host... +[2023-09-14 12:00:00,180][86888] Initializing env for player 1, init_info: {'port': 40403}... +[2023-09-14 12:00:00,345][86890] Initialized w:5 v:2 player:1 +[2023-09-14 12:00:00,347][86890] Initialized w:5 v:2 player:0 +[2023-09-14 12:00:00,347][86890] 2 agent workers initialized for env 5! +[2023-09-14 12:00:00,363][86890] Decorrelating experience for 64 frames... +[2023-09-14 12:00:00,373][86892] Initializing env for player 0, init_info: {'port': 40903}... +[2023-09-14 12:00:00,387][86891] Initialized w:7 v:2 player:0 +[2023-09-14 12:00:00,391][86891] Initialized w:7 v:2 player:1 +[2023-09-14 12:00:00,392][86891] 2 agent workers initialized for env 7! +[2023-09-14 12:00:00,404][86891] Decorrelating experience for 64 frames... +[2023-09-14 12:00:00,407][86892] Using port 40903 on host... +[2023-09-14 12:00:00,423][86892] Initializing env for player 1, init_info: {'port': 40903}... +[2023-09-14 12:00:00,482][86885] Initialized w:0 v:3 player:1 +[2023-09-14 12:00:00,483][86885] Initialized w:0 v:3 player:0 +[2023-09-14 12:00:00,484][86885] 2 agent workers initialized for env 0! +[2023-09-14 12:00:00,485][86887] Initialized w:3 v:3 player:1 +[2023-09-14 12:00:00,485][86887] Initialized w:3 v:3 player:0 +[2023-09-14 12:00:00,486][86887] 2 agent workers initialized for env 3! +[2023-09-14 12:00:00,488][86889] Initialized w:4 v:3 player:1 +[2023-09-14 12:00:00,489][86889] Initialized w:4 v:3 player:0 +[2023-09-14 12:00:00,490][86889] 2 agent workers initialized for env 4! +[2023-09-14 12:00:00,496][86887] Decorrelating experience for 96 frames... +[2023-09-14 12:00:00,497][86885] Decorrelating experience for 96 frames... +[2023-09-14 12:00:00,500][86889] Decorrelating experience for 96 frames... +[2023-09-14 12:00:00,517][86890] Port 40803 is available +[2023-09-14 12:00:00,517][86890] Using port 40803 +[2023-09-14 12:00:00,518][86890] Initializing env for player 0, init_info: {'port': 40803}... +[2023-09-14 12:00:00,544][86891] Port 41003 is available +[2023-09-14 12:00:00,544][86891] Using port 41003 +[2023-09-14 12:00:00,545][86891] Initializing env for player 0, init_info: {'port': 41003}... +[2023-09-14 12:00:00,548][86890] Using port 40803 on host... +[2023-09-14 12:00:00,568][86890] Initializing env for player 1, init_info: {'port': 40803}... +[2023-09-14 12:00:00,580][86891] Using port 41003 on host... +[2023-09-14 12:00:00,595][86891] Initializing env for player 1, init_info: {'port': 41003}... +[2023-09-14 12:00:00,974][86886] Initialized w:2 v:1 player:0 +[2023-09-14 12:00:00,975][86886] Initialized w:2 v:1 player:1 +[2023-09-14 12:00:00,976][86886] 2 agent workers initialized for env 2! +[2023-09-14 12:00:00,983][86886] Decorrelating experience for 32 frames... +[2023-09-14 12:00:01,052][86886] Multi agent env, num agents: 2 +[2023-09-14 12:00:01,085][86886] Multi agent env, num agents: 2 +[2023-09-14 12:00:01,175][86886] Port 40502 is available +[2023-09-14 12:00:01,176][86886] Using port 40502 +[2023-09-14 12:00:01,176][86886] Initializing env for player 0, init_info: {'port': 40502}... +[2023-09-14 12:00:01,226][86886] Using port 40502 on host... +[2023-09-14 12:00:01,226][86886] Initializing env for player 1, init_info: {'port': 40502}... +[2023-09-14 12:00:01,277][86888] Initialized w:1 v:3 player:0 +[2023-09-14 12:00:01,279][86888] Initialized w:1 v:3 player:1 +[2023-09-14 12:00:01,281][86888] 2 agent workers initialized for env 1! +[2023-09-14 12:00:01,294][86888] Decorrelating experience for 96 frames... +[2023-09-14 12:00:01,458][86892] Initialized w:6 v:3 player:1 +[2023-09-14 12:00:01,458][86892] Initialized w:6 v:3 player:0 +[2023-09-14 12:00:01,459][86892] 2 agent workers initialized for env 6! +[2023-09-14 12:00:01,469][86892] Decorrelating experience for 96 frames... +[2023-09-14 12:00:01,621][86890] Initialized w:5 v:3 player:1 +[2023-09-14 12:00:01,621][86890] Initialized w:5 v:3 player:0 +[2023-09-14 12:00:01,622][86890] 2 agent workers initialized for env 5! +[2023-09-14 12:00:01,631][86890] Decorrelating experience for 96 frames... +[2023-09-14 12:00:01,667][86891] Initialized w:7 v:3 player:0 +[2023-09-14 12:00:01,668][86891] Initialized w:7 v:3 player:1 +[2023-09-14 12:00:01,669][86891] 2 agent workers initialized for env 7! +[2023-09-14 12:00:01,701][86891] Decorrelating experience for 96 frames... +[2023-09-14 12:00:02,317][86886] Initialized w:2 v:2 player:1 +[2023-09-14 12:00:02,318][86886] Initialized w:2 v:2 player:0 +[2023-09-14 12:00:02,319][86886] 2 agent workers initialized for env 2! +[2023-09-14 12:00:02,321][86679] Signal inference workers to stop experience collection... +[2023-09-14 12:00:02,329][86886] Decorrelating experience for 64 frames... +[2023-09-14 12:00:02,331][86884] InferenceWorker_p0-w0: stopping experience collection +[2023-09-14 12:00:02,441][86886] Port 40503 is available +[2023-09-14 12:00:02,442][86886] Using port 40503 +[2023-09-14 12:00:02,442][86886] Initializing env for player 0, init_info: {'port': 40503}... +[2023-09-14 12:00:02,470][86886] Using port 40503 on host... +[2023-09-14 12:00:02,493][86886] Initializing env for player 1, init_info: {'port': 40503}... +[2023-09-14 12:00:03,359][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 34.6. Samples: 304. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 12:00:03,530][86886] Initialized w:2 v:3 player:0 +[2023-09-14 12:00:03,531][86886] Initialized w:2 v:3 player:1 +[2023-09-14 12:00:03,534][86886] 2 agent workers initialized for env 2! +[2023-09-14 12:00:03,543][86886] Decorrelating experience for 96 frames... +[2023-09-14 12:00:05,580][86679] Signal inference workers to resume experience collection... +[2023-09-14 12:00:05,580][86884] InferenceWorker_p0-w0: resuming experience collection +[2023-09-14 12:00:08,359][97397] Fps is (10 sec: 2457.6, 60 sec: 1782.1, 300 sec: 1782.1). Total num frames: 24576. Throughput: 0: 362.3. Samples: 4996. Policy #0 lag: (min: 0.0, avg: 1.5, max: 3.0) +[2023-09-14 12:00:09,288][86884] Updated weights for policy 0, policy_version 10 (0.0696) +[2023-09-14 12:00:10,502][97397] Heartbeat connected on Batcher_0 +[2023-09-14 12:00:10,506][97397] Heartbeat connected on LearnerWorker_p0 +[2023-09-14 12:00:10,516][97397] Heartbeat connected on InferenceWorker_p0-w0 +[2023-09-14 12:00:10,524][97397] Heartbeat connected on RolloutWorker_w1 +[2023-09-14 12:00:10,527][97397] Heartbeat connected on RolloutWorker_w2 +[2023-09-14 12:00:10,528][97397] Heartbeat connected on RolloutWorker_w0 +[2023-09-14 12:00:10,533][97397] Heartbeat connected on RolloutWorker_w3 +[2023-09-14 12:00:10,534][97397] Heartbeat connected on RolloutWorker_w4 +[2023-09-14 12:00:10,538][97397] Heartbeat connected on RolloutWorker_w5 +[2023-09-14 12:00:10,541][97397] Heartbeat connected on RolloutWorker_w6 +[2023-09-14 12:00:10,557][97397] Heartbeat connected on RolloutWorker_w7 +[2023-09-14 12:00:12,530][86884] Updated weights for policy 0, policy_version 20 (0.0013) +[2023-09-14 12:00:13,359][97397] Fps is (10 sec: 9011.4, 60 sec: 4795.8, 300 sec: 4795.8). Total num frames: 90112. Throughput: 0: 1275.1. Samples: 23960. Policy #0 lag: (min: 0.0, avg: 0.9, max: 2.0) +[2023-09-14 12:00:15,492][86884] Updated weights for policy 0, policy_version 30 (0.0015) +[2023-09-14 12:00:18,359][97397] Fps is (10 sec: 13517.0, 60 sec: 6714.8, 300 sec: 6714.8). Total num frames: 159744. Throughput: 0: 1457.8. Samples: 34680. Policy #0 lag: (min: 0.0, avg: 1.1, max: 2.0) +[2023-09-14 12:00:18,425][86884] Updated weights for policy 0, policy_version 40 (0.0012) +[2023-09-14 12:00:21,399][86884] Updated weights for policy 0, policy_version 50 (0.0012) +[2023-09-14 12:00:23,359][97397] Fps is (10 sec: 13926.3, 60 sec: 7967.2, 300 sec: 7967.2). Total num frames: 229376. Throughput: 0: 1917.3. Samples: 55200. Policy #0 lag: (min: 0.0, avg: 0.9, max: 3.0) +[2023-09-14 12:00:24,247][86884] Updated weights for policy 0, policy_version 60 (0.0013) +[2023-09-14 12:00:27,232][86884] Updated weights for policy 0, policy_version 70 (0.0013) +[2023-09-14 12:00:28,359][97397] Fps is (10 sec: 13926.3, 60 sec: 8849.0, 300 sec: 8849.0). Total num frames: 299008. Throughput: 0: 2259.5. Samples: 76348. Policy #0 lag: (min: 0.0, avg: 1.3, max: 3.0) +[2023-09-14 12:00:30,156][86884] Updated weights for policy 0, policy_version 80 (0.0012) +[2023-09-14 12:00:32,992][86884] Updated weights for policy 0, policy_version 90 (0.0014) +[2023-09-14 12:00:33,359][97397] Fps is (10 sec: 14336.1, 60 sec: 9609.1, 300 sec: 9609.1). Total num frames: 372736. Throughput: 0: 2246.8. Samples: 87152. Policy #0 lag: (min: 0.0, avg: 1.2, max: 2.0) +[2023-09-14 12:00:35,799][86884] Updated weights for policy 0, policy_version 100 (0.0012) +[2023-09-14 12:00:38,359][97397] Fps is (10 sec: 14745.6, 60 sec: 10195.6, 300 sec: 10195.6). Total num frames: 446464. Throughput: 0: 2490.3. Samples: 109052. Policy #0 lag: (min: 0.0, avg: 1.3, max: 3.0) +[2023-09-14 12:00:38,713][86884] Updated weights for policy 0, policy_version 110 (0.0014) +[2023-09-14 12:00:41,254][86887] DAMAGECOUNT value on done: 148.0 +[2023-09-14 12:00:41,254][86887] DAMAGECOUNT value on done: 25.0 +[2023-09-14 12:00:41,255][86887] Sum rewards: 2.715, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.014', 'AMMO3': '0.028', 'AMMO4': '0.070', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.124', 'WEAPON3': '0.200', 'weapon5': '0.212', 'weapon2': '0.504', 'weapon3': '0.880', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.480'} +[2023-09-14 12:00:41,255][86887] Sum rewards: 2.051, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.020', 'AMMO3': '0.051', 'weapon5': '0.052', 'WEAPON5': '0.100', 'AMMO4': '0.100', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.250', 'WEAPON3': '0.300', 'weapon4': '0.536', 'weapon3': '0.690', 'weapon2': '0.746', 'FRAGCOUNT': '1.000'} +[2023-09-14 12:00:41,354][86889] DAMAGECOUNT value on done: 60.0 +[2023-09-14 12:00:41,355][86889] DAMAGECOUNT value on done: 230.0 +[2023-09-14 12:00:41,356][86889] Sum rewards: 4.509, reward structure: {'HEALTH': '-1.600', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.007', 'AMMO4': '0.018', 'AMMO3': '0.047', 'WEAPON4': '0.100', 'weapon5': '0.190', 'WEAPON5': '0.200', 'weapon4': '0.258', 'WEAPON3': '0.300', 'weapon2': '0.660', 'weapon3': '1.026', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.300'} +[2023-09-14 12:00:41,641][86884] Updated weights for policy 0, policy_version 120 (0.0013) +[2023-09-14 12:00:42,025][86887] DAMAGECOUNT value on done: 20.0 +[2023-09-14 12:00:42,025][86887] DAMAGECOUNT value on done: 150.0 +[2023-09-14 12:00:42,025][86887] Sum rewards: 1.429, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO5': '0.005', 'AMMO4': '0.008', 'weapon5': '0.042', 'AMMO3': '0.071', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.200', 'weapon4': '0.388', 'WEAPON3': '0.400', 'weapon3': '0.532', 'weapon2': '0.580', 'FRAGCOUNT': '1.000'} +[2023-09-14 12:00:42,026][86887] Sum rewards: 3.509, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.018', 'weapon4': '0.028', 'AMMO3': '0.061', 'AMMO4': '0.087', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon5': '0.160', 'WEAPON3': '0.400', 'weapon2': '0.662', 'FRAGCOUNT': '1.000', 'weapon3': '1.388', 'DAMAGECOUNT': '1.500'} +[2023-09-14 12:00:42,091][86889] DAMAGECOUNT value on done: 75.0 +[2023-09-14 12:00:42,091][86889] DAMAGECOUNT value on done: 100.0 +[2023-09-14 12:00:42,092][86889] Sum rewards: 2.619, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.021', 'AMMO3': '0.023', 'WEAPON5': '0.100', 'weapon5': '0.102', 'AMMO4': '0.102', 'WEAPON3': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.220', 'weapon2': '0.608', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon3': '1.040'} +[2023-09-14 12:00:42,588][86887] DAMAGECOUNT value on done: 115.0 +[2023-09-14 12:00:42,588][86887] DAMAGECOUNT value on done: 10.0 +[2023-09-14 12:00:42,589][86887] Sum rewards: 4.568, reward structure: {'HEALTH': '-0.100', 'HITCOUNT': '0.000', 'AMMO2': '0.023', 'AMMO3': '0.026', 'WEAPON4': '0.100', 'AMMO4': '0.116', 'WEAPON3': '0.200', 'weapon2': '0.470', 'weapon4': '0.492', 'FRAGCOUNT': '1.000', 'weapon3': '1.090', 'DAMAGECOUNT': '1.150'} +[2023-09-14 12:00:42,589][86887] Sum rewards: -2.937, reward structure: {'HEALTH': '-3.150', 'DEATHCOUNT': '-3.000', 'FRAGCOUNT': '-0.002', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.011', 'AMMO4': '0.055', 'DAMAGECOUNT': '0.100', 'AMMO3': '0.127', 'weapon5': '0.162', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.302', 'weapon2': '0.562', 'WEAPON3': '0.700', 'weapon3': '0.788'} +[2023-09-14 12:00:42,667][86889] DAMAGECOUNT value on done: 20.0 +[2023-09-14 12:00:42,667][86889] DAMAGECOUNT value on done: 5.0 +[2023-09-14 12:00:42,741][86888] DAMAGECOUNT value on done: 165.0 +[2023-09-14 12:00:42,741][86888] DAMAGECOUNT value on done: 5.0 +[2023-09-14 12:00:42,742][86888] Sum rewards: 3.826, reward structure: {'HEALTH': '-0.920', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.006', 'AMMO3': '0.026', 'AMMO4': '0.031', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.156', 'weapon5': '0.162', 'WEAPON3': '0.200', 'weapon2': '0.384', 'weapon3': '0.926', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.650'} +[2023-09-14 12:00:42,742][86888] Sum rewards: -1.446, reward structure: {'HEALTH': '-2.550', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.018', 'AMMO3': '0.045', 'DAMAGECOUNT': '0.050', 'weapon5': '0.064', 'AMMO4': '0.091', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon4': '0.474', 'weapon2': '0.754', 'weapon3': '1.004'} +[2023-09-14 12:00:42,746][86892] DAMAGECOUNT value on done: 100.0 +[2023-09-14 12:00:42,746][86892] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:00:42,747][86892] Sum rewards: 4.040, reward structure: {'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO3': '0.020', 'WEAPON3': '0.200', 'weapon2': '0.684', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.166'} +[2023-09-14 12:00:42,944][86885] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:00:42,944][86885] DAMAGECOUNT value on done: 92.0 +[2023-09-14 12:00:42,945][86885] Sum rewards: 0.006, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.004', 'AMMO3': '0.033', 'AMMO2': '0.035', 'weapon5': '0.094', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.176', 'WEAPON3': '0.200', 'weapon4': '0.324', 'weapon2': '0.428', 'weapon3': '0.512'} +[2023-09-14 12:00:42,945][86885] Sum rewards: 1.704, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.012', 'AMMO2': '-0.002', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.065', 'WEAPON5': '0.200', 'weapon5': '0.300', 'WEAPON3': '0.400', 'weapon2': '0.600', 'DAMAGECOUNT': '0.920', 'weapon3': '1.228'} +[2023-09-14 12:00:43,140][86887] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:00:43,141][86887] DAMAGECOUNT value on done: 15.0 +[2023-09-14 12:00:43,181][86886] DAMAGECOUNT value on done: 15.0 +[2023-09-14 12:00:43,182][86886] DAMAGECOUNT value on done: 85.0 +[2023-09-14 12:00:43,183][86886] Sum rewards: 1.832, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.024', 'weapon4': '0.032', 'AMMO3': '0.063', 'weapon5': '0.086', 'WEAPON5': '0.100', 'AMMO4': '0.121', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.850', 'weapon2': '0.866', 'weapon3': '1.236'} +[2023-09-14 12:00:43,217][86889] DAMAGECOUNT value on done: 45.0 +[2023-09-14 12:00:43,217][86889] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:00:43,300][86888] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:00:43,300][86888] DAMAGECOUNT value on done: 85.0 +[2023-09-14 12:00:43,301][86888] Sum rewards: 1.528, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.001', 'AMMO5': '0.005', 'AMMO4': '0.005', 'AMMO3': '0.041', 'weapon5': '0.042', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.226', 'WEAPON3': '0.300', 'weapon2': '0.680', 'DAMAGECOUNT': '0.850', 'weapon3': '1.178'} +[2023-09-14 12:00:43,327][86892] DAMAGECOUNT value on done: 66.0 +[2023-09-14 12:00:43,328][86892] DAMAGECOUNT value on done: 75.0 +[2023-09-14 12:00:43,328][86892] Sum rewards: 1.429, reward structure: {'HEALTH': '-1.250', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.025', 'AMMO3': '0.046', 'WEAPON4': '0.100', 'AMMO4': '0.126', 'WEAPON5': '0.200', 'weapon4': '0.258', 'WEAPON3': '0.300', 'weapon5': '0.318', 'weapon2': '0.474', 'DAMAGECOUNT': '0.750', 'weapon3': '1.074'} +[2023-09-14 12:00:43,359][97397] Fps is (10 sec: 13926.4, 60 sec: 10494.0, 300 sec: 10494.0). Total num frames: 512000. Throughput: 0: 2883.1. Samples: 129740. Policy #0 lag: (min: 0.0, avg: 1.0, max: 3.0) +[2023-09-14 12:00:43,360][97397] Avg episode reward: [(0, '1.581')] +[2023-09-14 12:00:43,361][86679] Saving new best policy, reward=1.581! +[2023-09-14 12:00:43,516][86885] DAMAGECOUNT value on done: 79.0 +[2023-09-14 12:00:43,517][86885] DAMAGECOUNT value on done: 47.0 +[2023-09-14 12:00:43,518][86885] Sum rewards: 1.159, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.016', 'AMMO3': '0.068', 'AMMO4': '0.078', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.116', 'weapon4': '0.218', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.470', 'weapon2': '0.532', 'weapon3': '1.058'} +[2023-09-14 12:00:43,765][86886] DAMAGECOUNT value on done: 117.0 +[2023-09-14 12:00:43,765][86886] DAMAGECOUNT value on done: 15.0 +[2023-09-14 12:00:43,765][86886] Sum rewards: 0.938, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.006', 'AMMO5': '0.009', 'AMMO4': '0.031', 'weapon4': '0.042', 'AMMO3': '0.083', 'WEAPON4': '0.100', 'weapon5': '0.132', 'WEAPON5': '0.200', 'WEAPON3': '0.500', 'weapon2': '0.630', 'FRAGCOUNT': '0.999', 'weapon3': '1.036', 'DAMAGECOUNT': '1.170'} +[2023-09-14 12:00:43,766][86886] Sum rewards: 1.902, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.031', 'AMMO3': '0.048', 'DAMAGECOUNT': '0.150', 'AMMO4': '0.153', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon4': '0.520', 'weapon2': '0.530', 'weapon3': '0.970', 'FRAGCOUNT': '1.000'} +[2023-09-14 12:00:43,782][86891] DAMAGECOUNT value on done: 20.0 +[2023-09-14 12:00:43,782][86891] DAMAGECOUNT value on done: 10.0 +[2023-09-14 12:00:43,783][86891] Sum rewards: 0.681, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.014', 'AMMO3': '0.046', 'AMMO4': '0.070', 'WEAPON4': '0.100', 'weapon5': '0.186', 'weapon4': '0.196', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.592', 'weapon3': '0.870'} +[2023-09-14 12:00:43,783][86891] Sum rewards: 1.002, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.007', 'AMMO4': '0.023', 'AMMO3': '0.061', 'DAMAGECOUNT': '0.100', 'weapon5': '0.190', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.838', 'weapon3': '1.378'} +[2023-09-14 12:00:43,859][86888] DAMAGECOUNT value on done: 60.0 +[2023-09-14 12:00:43,860][86888] Sum rewards: 1.229, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'AMMO4': '-0.013', 'AMMO2': '-0.003', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO3': '0.036', 'WEAPON5': '0.100', 'weapon5': '0.100', 'WEAPON3': '0.300', 'weapon2': '0.528', 'DAMAGECOUNT': '0.600', 'weapon3': '1.578'} +[2023-09-14 12:00:43,859][86888] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:00:43,904][86892] DAMAGECOUNT value on done: 15.0 +[2023-09-14 12:00:43,904][86892] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:00:43,905][86892] Sum rewards: 0.758, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.004', 'AMMO2': '0.033', 'AMMO3': '0.068', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon5': '0.104', 'AMMO4': '0.164', 'weapon4': '0.354', 'WEAPON3': '0.400', 'weapon2': '0.548', 'weapon3': '1.034'} +[2023-09-14 12:00:44,036][97397] Keyboard interrupt detected in the event loop EvtLoop [Runner_EvtLoop, process=main process 97397], exiting... +[2023-09-14 12:00:44,037][86679] Stopping Batcher_0... +[2023-09-14 12:00:44,037][97397] Runner profile tree view: +main_loop: 53.4895 +[2023-09-14 12:00:44,038][86679] Loop batcher_evt_loop terminating... +[2023-09-14 12:00:44,039][86679] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000128_524288.pth... +[2023-09-14 12:00:44,039][97397] Collected {0: 520192}, FPS: 9725.1 +[2023-09-14 12:00:44,064][86884] Weights refcount: 2 0 +[2023-09-14 12:00:44,065][86884] Stopping InferenceWorker_p0-w0... +[2023-09-14 12:00:44,066][86884] Loop inference_proc0-0_evt_loop terminating... +[2023-09-14 12:00:44,094][86679] Stopping LearnerWorker_p0... +[2023-09-14 12:00:44,094][86679] Loop learner_proc0_evt_loop terminating... +[2023-09-14 12:00:44,843][86891] Stopping RolloutWorker_w7... +[2023-09-14 12:00:44,843][86891] Loop rollout_proc7_evt_loop terminating... +[2023-09-14 12:00:44,847][86889] Stopping RolloutWorker_w4... +[2023-09-14 12:00:44,848][86889] Loop rollout_proc4_evt_loop terminating... +[2023-09-14 12:00:44,849][86887] Stopping RolloutWorker_w3... +[2023-09-14 12:00:44,849][86887] Loop rollout_proc3_evt_loop terminating... +[2023-09-14 12:00:44,849][86892] Stopping RolloutWorker_w6... +[2023-09-14 12:00:44,850][86892] Loop rollout_proc6_evt_loop terminating... +[2023-09-14 12:00:44,856][86885] Stopping RolloutWorker_w0... +[2023-09-14 12:00:44,856][86885] Loop rollout_proc0_evt_loop terminating... +[2023-09-14 12:00:44,864][86886] Stopping RolloutWorker_w2... +[2023-09-14 12:00:44,865][86886] Loop rollout_proc2_evt_loop terminating... +[2023-09-14 12:00:44,871][86890] Stopping RolloutWorker_w5... +[2023-09-14 12:00:44,872][86890] Loop rollout_proc5_evt_loop terminating... +[2023-09-14 12:00:44,872][86888] Stopping RolloutWorker_w1... +[2023-09-14 12:00:44,872][86888] Loop rollout_proc1_evt_loop terminating... +[2023-09-14 12:00:45,671][97397] Environment doom_basic already registered, overwriting... +[2023-09-14 12:00:45,672][97397] Environment doom_two_colors_easy already registered, overwriting... +[2023-09-14 12:00:45,674][97397] Environment doom_two_colors_hard already registered, overwriting... +[2023-09-14 12:00:45,675][97397] Environment doom_dm already registered, overwriting... +[2023-09-14 12:00:45,676][97397] Environment doom_dwango5 already registered, overwriting... +[2023-09-14 12:00:45,677][97397] Environment doom_my_way_home_flat_actions already registered, overwriting... +[2023-09-14 12:00:45,678][97397] Environment doom_defend_the_center_flat_actions already registered, overwriting... +[2023-09-14 12:00:45,679][97397] Environment doom_my_way_home already registered, overwriting... +[2023-09-14 12:00:45,680][97397] Environment doom_deadly_corridor already registered, overwriting... +[2023-09-14 12:00:45,682][97397] Environment doom_defend_the_center already registered, overwriting... +[2023-09-14 12:00:45,683][97397] Environment doom_defend_the_line already registered, overwriting... +[2023-09-14 12:00:45,684][97397] Environment doom_health_gathering already registered, overwriting... +[2023-09-14 12:00:45,685][97397] Environment doom_health_gathering_supreme already registered, overwriting... +[2023-09-14 12:00:45,687][97397] Environment doom_battle already registered, overwriting... +[2023-09-14 12:00:45,688][97397] Environment doom_battle2 already registered, overwriting... +[2023-09-14 12:00:45,689][97397] Environment doom_duel_bots already registered, overwriting... +[2023-09-14 12:00:45,689][97397] Environment doom_deathmatch_bots already registered, overwriting... +[2023-09-14 12:00:45,690][97397] Environment doom_duel already registered, overwriting... +[2023-09-14 12:00:45,690][97397] Environment doom_deathmatch_full already registered, overwriting... +[2023-09-14 12:00:45,691][97397] Environment doom_benchmark already registered, overwriting... +[2023-09-14 12:00:45,692][97397] register_encoder_factory: +[2023-09-14 12:00:45,716][97397] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json +[2023-09-14 12:00:45,721][97397] Experiment dir /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment already exists! +[2023-09-14 12:00:45,722][97397] Resuming existing experiment from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment... +[2023-09-14 12:00:45,723][97397] Weights and Biases integration disabled +[2023-09-14 12:00:45,726][97397] Environment var CUDA_VISIBLE_DEVICES is 0,1 + +[2023-09-14 12:00:47,745][97397] Starting experiment with the following configuration: +help=False +algo=APPO +env=doom_duel +experiment=default_experiment +train_dir=/home/cogstack/Documents/optuna/environments/sample_factory/train_dir +restart_behavior=resume +device=gpu +seed=None +num_policies=1 +async_rl=True +serial_mode=False +batched_sampling=False +num_batches_to_accumulate=2 +worker_num_splits=2 +policy_workers_per_policy=1 +max_policy_lag=1000 +num_workers=8 +num_envs_per_worker=4 +batch_size=1024 +num_batches_per_epoch=1 +num_epochs=1 +rollout=32 +recurrence=32 +shuffle_minibatches=False +gamma=0.99 +reward_scale=1.0 +reward_clip=1000.0 +value_bootstrap=False +normalize_returns=True +exploration_loss_coeff=0.001 +value_loss_coeff=0.5 +kl_loss_coeff=0.0 +exploration_loss=symmetric_kl +gae_lambda=0.95 +ppo_clip_ratio=0.1 +ppo_clip_value=0.2 +with_vtrace=False +vtrace_rho=1.0 +vtrace_c=1.0 +optimizer=adam +adam_eps=1e-06 +adam_beta1=0.9 +adam_beta2=0.999 +max_grad_norm=4.0 +learning_rate=0.0001 +lr_schedule=constant +lr_schedule_kl_threshold=0.008 +lr_adaptive_min=1e-06 +lr_adaptive_max=0.01 +obs_subtract_mean=0.0 +obs_scale=255.0 +normalize_input=True +normalize_input_keys=None +decorrelate_experience_max_seconds=0 +decorrelate_envs_on_one_worker=True +actor_worker_gpus=[] +set_workers_cpu_affinity=True +force_envs_single_thread=False +default_niceness=0 +log_to_file=True +experiment_summaries_interval=10 +flush_summaries_interval=30 +stats_avg=100 +summaries_use_frameskip=True +heartbeat_interval=20 +heartbeat_reporting_interval=600 +train_for_env_steps=1000000 +train_for_seconds=10000000000 +save_every_sec=120 +keep_checkpoints=2 +load_checkpoint_kind=latest +save_milestones_sec=-1 +save_best_every_sec=5 +save_best_metric=reward +save_best_after=100000 +benchmark=False +encoder_mlp_layers=[512, 512] +encoder_conv_architecture=convnet_simple +encoder_conv_mlp_layers=[512] +use_rnn=True +rnn_size=512 +rnn_type=gru +rnn_num_layers=1 +decoder_mlp_layers=[] +nonlinearity=elu +policy_initialization=orthogonal +policy_init_gain=1.0 +actor_critic_share_weights=True +adaptive_stddev=True +continuous_tanh_scale=0.0 +initial_stddev=1.0 +use_env_info_cache=False +env_gpu_actions=False +env_gpu_observations=True +env_frameskip=4 +env_framestack=1 +pixel_format=CHW +use_record_episode_statistics=False +with_wandb=False +wandb_user=None +wandb_project=sample_factory +wandb_group=None +wandb_job_type=SF +wandb_tags=[] +with_pbt=False +pbt_mix_policies_in_one_env=True +pbt_period_env_steps=5000000 +pbt_start_mutation=20000000 +pbt_replace_fraction=0.3 +pbt_mutation_rate=0.15 +pbt_replace_reward_gap=0.1 +pbt_replace_reward_gap_absolute=1e-06 +pbt_optimize_gamma=False +pbt_target_objective=true_objective +pbt_perturb_min=1.1 +pbt_perturb_max=1.5 +num_agents=-1 +num_humans=0 +num_bots=-1 +start_bot_difficulty=None +timelimit=None +res_w=128 +res_h=72 +wide_aspect_ratio=False +eval_env_frameskip=1 +fps=35 +command_line=--env=doom_dm --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=20000000 +cli_args={'env': 'doom_dm', 'num_workers': 8, 'num_envs_per_worker': 4, 'train_for_env_steps': 20000000} +git_hash=20b6d44612dad7d171f23e13b1f3b4c5e5631cf9 +git_repo_name=https://github.com/MattStammers/optuna.git +[2023-09-14 12:00:47,747][97397] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json... +[2023-09-14 12:00:47,865][97397] Rollout worker 0 uses device cpu +[2023-09-14 12:00:47,867][97397] Rollout worker 1 uses device cpu +[2023-09-14 12:00:47,868][97397] Rollout worker 2 uses device cpu +[2023-09-14 12:00:47,869][97397] Rollout worker 3 uses device cpu +[2023-09-14 12:00:47,870][97397] Rollout worker 4 uses device cpu +[2023-09-14 12:00:47,871][97397] Rollout worker 5 uses device cpu +[2023-09-14 12:00:47,872][97397] Rollout worker 6 uses device cpu +[2023-09-14 12:00:47,874][97397] Rollout worker 7 uses device cpu +[2023-09-14 12:00:47,938][97397] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:00:47,939][97397] InferenceWorker_p0-w0: min num requests: 2 +[2023-09-14 12:00:47,967][97397] Starting all processes... +[2023-09-14 12:00:47,968][97397] Starting process learner_proc0 +[2023-09-14 12:00:49,630][97397] Starting all processes... +[2023-09-14 12:00:49,632][92931] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:00:49,632][92931] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 +[2023-09-14 12:00:49,635][97397] Starting process inference_proc0-0 +[2023-09-14 12:00:49,636][97397] Starting process rollout_proc0 +[2023-09-14 12:00:49,636][97397] Starting process rollout_proc1 +[2023-09-14 12:00:49,637][97397] Starting process rollout_proc2 +[2023-09-14 12:00:49,637][97397] Starting process rollout_proc3 +[2023-09-14 12:00:49,638][97397] Starting process rollout_proc4 +[2023-09-14 12:00:49,652][92931] Num visible devices: 1 +[2023-09-14 12:00:49,639][97397] Starting process rollout_proc5 +[2023-09-14 12:00:49,669][92931] Starting seed is not provided +[2023-09-14 12:00:49,669][92931] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:00:49,669][92931] Initializing actor-critic model on device cuda:0 +[2023-09-14 12:00:49,670][92931] RunningMeanStd input shape: (23,) +[2023-09-14 12:00:49,670][92931] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:00:49,671][92931] RunningMeanStd input shape: (1,) +[2023-09-14 12:00:49,639][97397] Starting process rollout_proc6 +[2023-09-14 12:00:49,639][97397] Starting process rollout_proc7 +[2023-09-14 12:00:49,684][92931] ConvEncoder: input_channels=3 +[2023-09-14 12:00:49,847][92931] Conv encoder output size: 512 +[2023-09-14 12:00:49,848][92931] Policy head output size: 640 +[2023-09-14 12:00:49,872][92931] Created Actor Critic model with architecture: +[2023-09-14 12:00:49,873][92931] ActorCriticSharedWeights( + (obs_normalizer): ObservationNormalizer( + (running_mean_std): RunningMeanStdDictInPlace( + (running_mean_std): ModuleDict( + (measurements): RunningMeanStdInPlace() + (obs): RunningMeanStdInPlace() + ) + ) + ) + (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) + (encoder): VizdoomEncoder( + (basic_encoder): ConvEncoder( + (enc): RecursiveScriptModule( + original_name=ConvEncoderImpl + (conv_head): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Conv2d) + (1): RecursiveScriptModule(original_name=ELU) + (2): RecursiveScriptModule(original_name=Conv2d) + (3): RecursiveScriptModule(original_name=ELU) + (4): RecursiveScriptModule(original_name=Conv2d) + (5): RecursiveScriptModule(original_name=ELU) + ) + (mlp_layers): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Linear) + (1): RecursiveScriptModule(original_name=ELU) + ) + ) + ) + (measurements_head): Sequential( + (0): Linear(in_features=23, out_features=128, bias=True) + (1): ELU(alpha=1.0) + (2): Linear(in_features=128, out_features=128, bias=True) + (3): ELU(alpha=1.0) + ) + ) + (core): ModelCoreRNN( + (core): GRU(640, 512) + ) + (decoder): MlpDecoder( + (mlp): Identity() + ) + (critic_linear): Linear(in_features=512, out_features=1, bias=True) + (action_parameterization): ActionParameterizationDefault( + (distribution_linear): Linear(in_features=512, out_features=41, bias=True) + ) +) +[2023-09-14 12:00:51,052][92931] Using optimizer +[2023-09-14 12:00:51,053][92931] Loading state from checkpoint /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000128_524288.pth... +[2023-09-14 12:00:51,084][92931] Loading model from checkpoint +[2023-09-14 12:00:51,089][92931] Loaded experiment state at self.train_step=128, self.env_steps=524288 +[2023-09-14 12:00:51,090][92931] Initialized policy 0 weights for model version 128 +[2023-09-14 12:00:51,092][92931] LearnerWorker_p0 finished initialization! +[2023-09-14 12:00:51,093][92931] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:00:51,731][93249] Worker 7 uses CPU cores [28, 29, 30, 31] +[2023-09-14 12:00:51,751][93222] Worker 0 uses CPU cores [0, 1, 2, 3] +[2023-09-14 12:00:51,879][93245] Worker 5 uses CPU cores [20, 21, 22, 23] +[2023-09-14 12:00:51,927][93244] Worker 1 uses CPU cores [4, 5, 6, 7] +[2023-09-14 12:00:51,983][93246] Worker 3 uses CPU cores [12, 13, 14, 15] +[2023-09-14 12:00:51,985][93248] Worker 4 uses CPU cores [16, 17, 18, 19] +[2023-09-14 12:00:52,046][93247] Worker 6 uses CPU cores [24, 25, 26, 27] +[2023-09-14 12:00:52,095][93243] Worker 2 uses CPU cores [8, 9, 10, 11] +[2023-09-14 12:00:52,233][97397] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 524288. Throughput: 0: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 12:00:52,235][93205] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:00:52,235][93205] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 +[2023-09-14 12:00:52,255][93205] Num visible devices: 1 +[2023-09-14 12:00:52,883][93205] RunningMeanStd input shape: (23,) +[2023-09-14 12:00:52,883][93205] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:00:52,883][93205] RunningMeanStd input shape: (1,) +[2023-09-14 12:00:52,896][93205] ConvEncoder: input_channels=3 +[2023-09-14 12:00:52,999][93205] Conv encoder output size: 512 +[2023-09-14 12:00:53,000][93205] Policy head output size: 640 +[2023-09-14 12:00:53,283][97397] Inference worker 0-0 is ready! +[2023-09-14 12:00:53,285][97397] All inference workers are ready! Signal rollout workers to start! +[2023-09-14 12:00:53,288][93246] Multi agent env, num agents: 2 +[2023-09-14 12:00:53,288][93245] Multi agent env, num agents: 2 +[2023-09-14 12:00:53,289][93244] Multi agent env, num agents: 2 +[2023-09-14 12:00:53,289][93247] Multi agent env, num agents: 2 +[2023-09-14 12:00:53,289][93248] Multi agent env, num agents: 2 +[2023-09-14 12:00:53,289][93243] Multi agent env, num agents: 2 +[2023-09-14 12:00:53,292][93249] Multi agent env, num agents: 2 +[2023-09-14 12:00:53,293][93222] Multi agent env, num agents: 2 +[2023-09-14 12:00:53,320][93245] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:00:53,320][93246] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:00:53,321][93247] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:00:53,322][93248] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:00:53,322][93245] Multi agent env, num agents: 2 +[2023-09-14 12:00:53,323][93246] Multi agent env, num agents: 2 +[2023-09-14 12:00:53,324][93247] Multi agent env, num agents: 2 +[2023-09-14 12:00:53,325][93222] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:00:53,325][93248] Multi agent env, num agents: 2 +[2023-09-14 12:00:53,326][93249] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:00:53,326][93243] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:00:53,328][93222] Multi agent env, num agents: 2 +[2023-09-14 12:00:53,329][93243] Multi agent env, num agents: 2 +[2023-09-14 12:00:53,329][93249] Multi agent env, num agents: 2 +[2023-09-14 12:00:53,336][93244] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:00:53,340][93244] Multi agent env, num agents: 2 +[2023-09-14 12:00:53,352][93246] Port 40600 is available +[2023-09-14 12:00:53,352][93246] Using port 40600 +[2023-09-14 12:00:53,353][93245] Port 40800 is available +[2023-09-14 12:00:53,353][93245] Using port 40800 +[2023-09-14 12:00:53,353][93246] Initializing env for player 0, init_info: {'port': 40600}... +[2023-09-14 12:00:53,354][93247] Port 40900 is available +[2023-09-14 12:00:53,354][93247] Using port 40900 +[2023-09-14 12:00:53,354][93248] Port 40700 is available +[2023-09-14 12:00:53,354][93248] Using port 40700 +[2023-09-14 12:00:53,355][93245] Initializing env for player 0, init_info: {'port': 40800}... +[2023-09-14 12:00:53,355][93248] Initializing env for player 0, init_info: {'port': 40700}... +[2023-09-14 12:00:53,358][93222] Port 40300 is available +[2023-09-14 12:00:53,358][93222] Using port 40300 +[2023-09-14 12:00:53,358][93249] UDP port 41000 cannot be used [Errno 98] Address already in use +[2023-09-14 12:00:53,359][93249] Port 42000 is available +[2023-09-14 12:00:53,359][93249] Using port 42000 +[2023-09-14 12:00:53,359][93222] Initializing env for player 0, init_info: {'port': 40300}... +[2023-09-14 12:00:53,360][93249] Initializing env for player 0, init_info: {'port': 42000}... +[2023-09-14 12:00:53,360][93243] Port 40500 is available +[2023-09-14 12:00:53,360][93243] Using port 40500 +[2023-09-14 12:00:53,361][93243] Initializing env for player 0, init_info: {'port': 40500}... +[2023-09-14 12:00:53,384][93245] Using port 40800 on host... +[2023-09-14 12:00:53,386][93244] Port 40400 is available +[2023-09-14 12:00:53,386][93244] Using port 40400 +[2023-09-14 12:00:53,387][93244] Initializing env for player 0, init_info: {'port': 40400}... +[2023-09-14 12:00:53,389][93222] Using port 40300 on host... +[2023-09-14 12:00:53,390][93243] Using port 40500 on host... +[2023-09-14 12:00:53,391][93249] Using port 42000 on host... +[2023-09-14 12:00:53,392][93248] Using port 40700 on host... +[2023-09-14 12:00:53,399][93246] Using port 40600 on host... +[2023-09-14 12:00:53,406][93248] Initializing env for player 1, init_info: {'port': 40700}... +[2023-09-14 12:00:53,406][93245] Initializing env for player 1, init_info: {'port': 40800}... +[2023-09-14 12:00:53,410][93222] Initializing env for player 1, init_info: {'port': 40300}... +[2023-09-14 12:00:53,410][93249] Initializing env for player 1, init_info: {'port': 42000}... +[2023-09-14 12:00:53,411][93243] Initializing env for player 1, init_info: {'port': 40500}... +[2023-09-14 12:00:53,411][93246] Initializing env for player 1, init_info: {'port': 40600}... +[2023-09-14 12:00:53,425][93244] Using port 40400 on host... +[2023-09-14 12:00:53,438][93244] Initializing env for player 1, init_info: {'port': 40400}... +[2023-09-14 12:00:54,433][93243] Initialized w:2 v:0 player:1 +[2023-09-14 12:00:54,475][93248] Initialized w:4 v:0 player:0 +[2023-09-14 12:00:54,476][93248] Initialized w:4 v:0 player:1 +[2023-09-14 12:00:54,477][93248] 2 agent workers initialized for env 4! +[2023-09-14 12:00:54,486][93248] Decorrelating experience for 0 frames... +[2023-09-14 12:00:54,487][93248] Port 40701 is available +[2023-09-14 12:00:54,487][93248] Using port 40701 +[2023-09-14 12:00:54,487][93248] Initializing env for player 0, init_info: {'port': 40701}... +[2023-09-14 12:00:54,516][93248] Using port 40701 on host... +[2023-09-14 12:00:54,538][93248] Initializing env for player 1, init_info: {'port': 40701}... +[2023-09-14 12:00:54,560][93222] Initialized w:0 v:0 player:1 +[2023-09-14 12:00:54,561][93222] Initialized w:0 v:0 player:0 +[2023-09-14 12:00:54,562][93222] 2 agent workers initialized for env 0! +[2023-09-14 12:00:54,572][93249] Initialized w:7 v:0 player:1 +[2023-09-14 12:00:54,574][93222] Decorrelating experience for 0 frames... +[2023-09-14 12:00:54,575][93222] Port 40301 is available +[2023-09-14 12:00:54,575][93249] Initialized w:7 v:0 player:0 +[2023-09-14 12:00:54,575][93222] Using port 40301 +[2023-09-14 12:00:54,575][93246] Initialized w:3 v:0 player:1 +[2023-09-14 12:00:54,575][93246] Initialized w:3 v:0 player:0 +[2023-09-14 12:00:54,576][93222] Initializing env for player 0, init_info: {'port': 40301}... +[2023-09-14 12:00:54,576][93249] 2 agent workers initialized for env 7! +[2023-09-14 12:00:54,577][93246] 2 agent workers initialized for env 3! +[2023-09-14 12:00:54,585][93244] Initialized w:1 v:0 player:1 +[2023-09-14 12:00:54,586][93244] Initialized w:1 v:0 player:0 +[2023-09-14 12:00:54,587][93246] Decorrelating experience for 0 frames... +[2023-09-14 12:00:54,588][93244] 2 agent workers initialized for env 1! +[2023-09-14 12:00:54,588][93246] Port 40601 is available +[2023-09-14 12:00:54,589][93246] Using port 40601 +[2023-09-14 12:00:54,589][93246] Initializing env for player 0, init_info: {'port': 40601}... +[2023-09-14 12:00:54,590][93245] Initialized w:5 v:0 player:1 +[2023-09-14 12:00:54,591][93245] Initialized w:5 v:0 player:0 +[2023-09-14 12:00:54,592][93245] 2 agent workers initialized for env 5! +[2023-09-14 12:00:54,605][93222] Using port 40301 on host... +[2023-09-14 12:00:54,607][93244] Decorrelating experience for 0 frames... +[2023-09-14 12:00:54,608][93245] Decorrelating experience for 0 frames... +[2023-09-14 12:00:54,608][93249] Decorrelating experience for 0 frames... +[2023-09-14 12:00:54,608][93244] Port 40401 is available +[2023-09-14 12:00:54,608][93245] Port 40801 is available +[2023-09-14 12:00:54,608][93244] Using port 40401 +[2023-09-14 12:00:54,609][93245] Using port 40801 +[2023-09-14 12:00:54,609][93249] UDP port 41001 cannot be used [Errno 98] Address already in use +[2023-09-14 12:00:54,609][93249] Port 42001 is available +[2023-09-14 12:00:54,609][93244] Initializing env for player 0, init_info: {'port': 40401}... +[2023-09-14 12:00:54,609][93245] Initializing env for player 0, init_info: {'port': 40801}... +[2023-09-14 12:00:54,609][93249] Using port 42001 +[2023-09-14 12:00:54,610][93249] Initializing env for player 0, init_info: {'port': 42001}... +[2023-09-14 12:00:54,617][93247] Initializing env for player 0, init_info: {'port': 40900}... +[2023-09-14 12:00:54,626][93222] Initializing env for player 1, init_info: {'port': 40301}... +[2023-09-14 12:00:54,634][93246] Using port 40601 on host... +[2023-09-14 12:00:54,640][93249] Using port 42001 on host... +[2023-09-14 12:00:54,642][93246] Initializing env for player 1, init_info: {'port': 40601}... +[2023-09-14 12:00:54,658][93244] Using port 40401 on host... +[2023-09-14 12:00:54,658][93245] Using port 40801 on host... +[2023-09-14 12:00:54,659][93245] Initializing env for player 1, init_info: {'port': 40801}... +[2023-09-14 12:00:54,660][93249] Initializing env for player 1, init_info: {'port': 42001}... +[2023-09-14 12:00:54,663][93247] Using port 40900 on host... +[2023-09-14 12:00:54,666][93244] Initializing env for player 1, init_info: {'port': 40401}... +[2023-09-14 12:00:54,683][93247] Initializing env for player 1, init_info: {'port': 40900}... +[2023-09-14 12:00:55,431][93243] Initialized w:2 v:0 player:0 +[2023-09-14 12:00:55,433][93243] 2 agent workers initialized for env 2! +[2023-09-14 12:00:55,447][93243] Decorrelating experience for 0 frames... +[2023-09-14 12:00:55,448][93243] Port 40501 is available +[2023-09-14 12:00:55,448][93243] Using port 40501 +[2023-09-14 12:00:55,448][93243] Initializing env for player 0, init_info: {'port': 40501}... +[2023-09-14 12:00:55,477][93243] Using port 40501 on host... +[2023-09-14 12:00:55,499][93243] Initializing env for player 1, init_info: {'port': 40501}... +[2023-09-14 12:00:55,669][93248] Initialized w:4 v:1 player:0 +[2023-09-14 12:00:55,670][93248] Initialized w:4 v:1 player:1 +[2023-09-14 12:00:55,671][93248] 2 agent workers initialized for env 4! +[2023-09-14 12:00:55,684][93248] Decorrelating experience for 32 frames... +[2023-09-14 12:00:55,726][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 524288. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 12:00:55,762][93248] Multi agent env, num agents: 2 +[2023-09-14 12:00:55,763][93245] Initialized w:5 v:1 player:0 +[2023-09-14 12:00:55,765][93245] Initialized w:5 v:1 player:1 +[2023-09-14 12:00:55,766][93245] 2 agent workers initialized for env 5! +[2023-09-14 12:00:55,770][93222] Initialized w:0 v:1 player:1 +[2023-09-14 12:00:55,770][93222] Initialized w:0 v:1 player:0 +[2023-09-14 12:00:55,771][93222] 2 agent workers initialized for env 0! +[2023-09-14 12:00:55,777][93245] Decorrelating experience for 32 frames... +[2023-09-14 12:00:55,781][93222] Decorrelating experience for 32 frames... +[2023-09-14 12:00:55,808][93248] Multi agent env, num agents: 2 +[2023-09-14 12:00:55,827][93249] Initialized w:7 v:1 player:1 +[2023-09-14 12:00:55,828][93249] Initialized w:7 v:1 player:0 +[2023-09-14 12:00:55,829][93249] 2 agent workers initialized for env 7! +[2023-09-14 12:00:55,840][93249] Decorrelating experience for 32 frames... +[2023-09-14 12:00:55,840][93244] Initialized w:1 v:1 player:0 +[2023-09-14 12:00:55,840][93244] Initialized w:1 v:1 player:1 +[2023-09-14 12:00:55,842][93244] 2 agent workers initialized for env 1! +[2023-09-14 12:00:55,843][93246] Initialized w:3 v:1 player:1 +[2023-09-14 12:00:55,844][93246] Initialized w:3 v:1 player:0 +[2023-09-14 12:00:55,846][93246] 2 agent workers initialized for env 3! +[2023-09-14 12:00:55,847][93248] Port 40702 is available +[2023-09-14 12:00:55,848][93248] Using port 40702 +[2023-09-14 12:00:55,848][93248] Initializing env for player 0, init_info: {'port': 40702}... +[2023-09-14 12:00:55,849][93247] Initialized w:6 v:0 player:1 +[2023-09-14 12:00:55,849][93247] Initialized w:6 v:0 player:0 +[2023-09-14 12:00:55,851][93247] 2 agent workers initialized for env 6! +[2023-09-14 12:00:55,855][93246] Decorrelating experience for 32 frames... +[2023-09-14 12:00:55,856][93244] Decorrelating experience for 32 frames... +[2023-09-14 12:00:55,860][93247] Decorrelating experience for 0 frames... +[2023-09-14 12:00:55,861][93247] Port 40901 is available +[2023-09-14 12:00:55,861][93247] Using port 40901 +[2023-09-14 12:00:55,861][93247] Initializing env for player 0, init_info: {'port': 40901}... +[2023-09-14 12:00:55,887][93222] Multi agent env, num agents: 2 +[2023-09-14 12:00:55,889][93248] Using port 40702 on host... +[2023-09-14 12:00:55,892][93247] Using port 40901 on host... +[2023-09-14 12:00:55,897][93245] Multi agent env, num agents: 2 +[2023-09-14 12:00:55,899][93248] Initializing env for player 1, init_info: {'port': 40702}... +[2023-09-14 12:00:55,914][93247] Initializing env for player 1, init_info: {'port': 40901}... +[2023-09-14 12:00:55,921][93222] Multi agent env, num agents: 2 +[2023-09-14 12:00:55,921][93249] Multi agent env, num agents: 2 +[2023-09-14 12:00:55,937][93246] Multi agent env, num agents: 2 +[2023-09-14 12:00:55,942][93245] Multi agent env, num agents: 2 +[2023-09-14 12:00:55,953][93222] Port 40302 is available +[2023-09-14 12:00:55,953][93222] Using port 40302 +[2023-09-14 12:00:55,954][93222] Initializing env for player 0, init_info: {'port': 40302}... +[2023-09-14 12:00:55,956][93249] Multi agent env, num agents: 2 +[2023-09-14 12:00:55,965][93244] Multi agent env, num agents: 2 +[2023-09-14 12:00:55,968][93246] Multi agent env, num agents: 2 +[2023-09-14 12:00:55,976][93245] Port 40802 is available +[2023-09-14 12:00:55,976][93245] Using port 40802 +[2023-09-14 12:00:55,976][93245] Initializing env for player 0, init_info: {'port': 40802}... +[2023-09-14 12:00:55,985][93249] UDP port 41002 cannot be used [Errno 98] Address already in use +[2023-09-14 12:00:55,986][93249] Port 42002 is available +[2023-09-14 12:00:55,986][93249] Using port 42002 +[2023-09-14 12:00:55,986][93249] Initializing env for player 0, init_info: {'port': 42002}... +[2023-09-14 12:00:55,994][93244] Multi agent env, num agents: 2 +[2023-09-14 12:00:55,997][93246] Port 40602 is available +[2023-09-14 12:00:55,998][93246] Using port 40602 +[2023-09-14 12:00:55,998][93246] Initializing env for player 0, init_info: {'port': 40602}... +[2023-09-14 12:00:55,999][93222] Using port 40302 on host... +[2023-09-14 12:00:56,004][93245] Using port 40802 on host... +[2023-09-14 12:00:56,008][93222] Initializing env for player 1, init_info: {'port': 40302}... +[2023-09-14 12:00:56,016][93249] Using port 42002 on host... +[2023-09-14 12:00:56,026][93244] Port 40402 is available +[2023-09-14 12:00:56,026][93244] Using port 40402 +[2023-09-14 12:00:56,027][93244] Initializing env for player 0, init_info: {'port': 40402}... +[2023-09-14 12:00:56,027][93245] Initializing env for player 1, init_info: {'port': 40802}... +[2023-09-14 12:00:56,029][93246] Using port 40602 on host... +[2023-09-14 12:00:56,037][93249] Initializing env for player 1, init_info: {'port': 42002}... +[2023-09-14 12:00:56,048][93246] Initializing env for player 1, init_info: {'port': 40602}... +[2023-09-14 12:00:56,074][93244] Using port 40402 on host... +[2023-09-14 12:00:56,077][93244] Initializing env for player 1, init_info: {'port': 40402}... +[2023-09-14 12:00:56,615][93243] Initialized w:2 v:1 player:1 +[2023-09-14 12:00:56,616][93243] Initialized w:2 v:1 player:0 +[2023-09-14 12:00:56,617][93243] 2 agent workers initialized for env 2! +[2023-09-14 12:00:56,631][93243] Decorrelating experience for 32 frames... +[2023-09-14 12:00:56,693][93243] Multi agent env, num agents: 2 +[2023-09-14 12:00:56,726][93243] Multi agent env, num agents: 2 +[2023-09-14 12:00:56,755][93243] Port 40502 is available +[2023-09-14 12:00:56,755][93243] Using port 40502 +[2023-09-14 12:00:56,949][93247] Initialized w:6 v:1 player:1 +[2023-09-14 12:00:56,949][93247] Initialized w:6 v:1 player:0 +[2023-09-14 12:00:56,951][93247] 2 agent workers initialized for env 6! +[2023-09-14 12:00:56,959][93247] Decorrelating experience for 32 frames... +[2023-09-14 12:00:57,027][93247] Multi agent env, num agents: 2 +[2023-09-14 12:00:57,057][93247] Multi agent env, num agents: 2 +[2023-09-14 12:00:57,072][93249] Initialized w:7 v:2 player:0 +[2023-09-14 12:00:57,074][93249] Initialized w:7 v:2 player:1 +[2023-09-14 12:00:57,074][93249] 2 agent workers initialized for env 7! +[2023-09-14 12:00:57,080][93248] Initialized w:4 v:2 player:1 +[2023-09-14 12:00:57,081][93248] Initialized w:4 v:2 player:0 +[2023-09-14 12:00:57,082][93248] 2 agent workers initialized for env 4! +[2023-09-14 12:00:57,087][93247] Port 40902 is available +[2023-09-14 12:00:57,087][93247] Using port 40902 +[2023-09-14 12:00:57,088][93249] Decorrelating experience for 64 frames... +[2023-09-14 12:00:57,088][93247] Initializing env for player 0, init_info: {'port': 40902}... +[2023-09-14 12:00:57,092][93248] Decorrelating experience for 64 frames... +[2023-09-14 12:00:57,110][93222] Initialized w:0 v:2 player:0 +[2023-09-14 12:00:57,111][93222] Initialized w:0 v:2 player:1 +[2023-09-14 12:00:57,112][93222] 2 agent workers initialized for env 0! +[2023-09-14 12:00:57,120][93222] Decorrelating experience for 64 frames... +[2023-09-14 12:00:57,122][93247] Using port 40902 on host... +[2023-09-14 12:00:57,139][93247] Initializing env for player 1, init_info: {'port': 40902}... +[2023-09-14 12:00:57,209][93245] Initialized w:5 v:2 player:0 +[2023-09-14 12:00:57,210][93245] Initialized w:5 v:2 player:1 +[2023-09-14 12:00:57,211][93245] 2 agent workers initialized for env 5! +[2023-09-14 12:00:57,218][93246] Initialized w:3 v:2 player:1 +[2023-09-14 12:00:57,219][93246] Initialized w:3 v:2 player:0 +[2023-09-14 12:00:57,220][93246] 2 agent workers initialized for env 3! +[2023-09-14 12:00:57,223][93245] Decorrelating experience for 64 frames... +[2023-09-14 12:00:57,230][93246] Decorrelating experience for 64 frames... +[2023-09-14 12:00:57,243][93248] Port 40703 is available +[2023-09-14 12:00:57,243][93248] Using port 40703 +[2023-09-14 12:00:57,244][93248] Initializing env for player 0, init_info: {'port': 40703}... +[2023-09-14 12:00:57,269][93222] Port 40303 is available +[2023-09-14 12:00:57,269][93222] Using port 40303 +[2023-09-14 12:00:57,269][93249] Port 41003 is available +[2023-09-14 12:00:57,270][93249] Using port 41003 +[2023-09-14 12:00:57,270][93249] Initializing env for player 0, init_info: {'port': 41003}... +[2023-09-14 12:00:57,277][93244] Initialized w:1 v:2 player:1 +[2023-09-14 12:00:57,277][93244] Initialized w:1 v:2 player:0 +[2023-09-14 12:00:57,278][93244] 2 agent workers initialized for env 1! +[2023-09-14 12:00:57,279][93248] Using port 40703 on host... +[2023-09-14 12:00:57,288][93244] Decorrelating experience for 64 frames... +[2023-09-14 12:00:57,294][93248] Initializing env for player 1, init_info: {'port': 40703}... +[2023-09-14 12:00:57,306][93249] Using port 41003 on host... +[2023-09-14 12:00:57,310][93243] Initializing env for player 0, init_info: {'port': 40502}... +[2023-09-14 12:00:57,321][93249] Initializing env for player 1, init_info: {'port': 41003}... +[2023-09-14 12:00:57,354][93243] Using port 40502 on host... +[2023-09-14 12:00:57,362][93243] Initializing env for player 1, init_info: {'port': 40502}... +[2023-09-14 12:00:57,415][93246] Port 40603 is available +[2023-09-14 12:00:57,415][93245] Port 40803 is available +[2023-09-14 12:00:57,415][93246] Using port 40603 +[2023-09-14 12:00:57,415][93245] Using port 40803 +[2023-09-14 12:00:57,416][93245] Initializing env for player 0, init_info: {'port': 40803}... +[2023-09-14 12:00:57,416][93246] Initializing env for player 0, init_info: {'port': 40603}... +[2023-09-14 12:00:57,452][93245] Using port 40803 on host... +[2023-09-14 12:00:57,462][93246] Using port 40603 on host... +[2023-09-14 12:00:57,467][93245] Initializing env for player 1, init_info: {'port': 40803}... +[2023-09-14 12:00:57,469][93246] Initializing env for player 1, init_info: {'port': 40603}... +[2023-09-14 12:00:57,473][93244] Port 40403 is available +[2023-09-14 12:00:57,473][93244] Using port 40403 +[2023-09-14 12:00:58,202][93247] Initialized w:6 v:2 player:1 +[2023-09-14 12:00:58,202][93247] Initialized w:6 v:2 player:0 +[2023-09-14 12:00:58,203][93247] 2 agent workers initialized for env 6! +[2023-09-14 12:00:58,213][93247] Decorrelating experience for 64 frames... +[2023-09-14 12:00:58,230][93222] Initializing env for player 0, init_info: {'port': 40303}... +[2023-09-14 12:00:58,265][93222] Using port 40303 on host... +[2023-09-14 12:00:58,281][93222] Initializing env for player 1, init_info: {'port': 40303}... +[2023-09-14 12:00:58,350][93247] Port 40903 is available +[2023-09-14 12:00:58,350][93247] Using port 40903 +[2023-09-14 12:00:58,408][93243] Initialized w:2 v:2 player:1 +[2023-09-14 12:00:58,409][93243] Initialized w:2 v:2 player:0 +[2023-09-14 12:00:58,410][93243] 2 agent workers initialized for env 2! +[2023-09-14 12:00:58,417][93243] Decorrelating experience for 64 frames... +[2023-09-14 12:00:58,438][93248] Initialized w:4 v:3 player:1 +[2023-09-14 12:00:58,438][93248] Initialized w:4 v:3 player:0 +[2023-09-14 12:00:58,440][93248] 2 agent workers initialized for env 4! +[2023-09-14 12:00:58,450][93248] Decorrelating experience for 96 frames... +[2023-09-14 12:00:58,506][93249] Initialized w:7 v:3 player:1 +[2023-09-14 12:00:58,507][93249] Initialized w:7 v:3 player:0 +[2023-09-14 12:00:58,509][93249] 2 agent workers initialized for env 7! +[2023-09-14 12:00:58,517][93245] Initialized w:5 v:3 player:1 +[2023-09-14 12:00:58,517][93245] Initialized w:5 v:3 player:0 +[2023-09-14 12:00:58,519][93245] 2 agent workers initialized for env 5! +[2023-09-14 12:00:58,519][93249] Decorrelating experience for 96 frames... +[2023-09-14 12:00:58,528][93245] Decorrelating experience for 96 frames... +[2023-09-14 12:00:58,532][93246] Initialized w:3 v:3 player:1 +[2023-09-14 12:00:58,533][93246] Initialized w:3 v:3 player:0 +[2023-09-14 12:00:58,534][93246] 2 agent workers initialized for env 3! +[2023-09-14 12:00:58,544][93246] Decorrelating experience for 96 frames... +[2023-09-14 12:00:58,552][93243] Port 40503 is available +[2023-09-14 12:00:58,552][93243] Using port 40503 +[2023-09-14 12:00:58,553][93243] Initializing env for player 0, init_info: {'port': 40503}... +[2023-09-14 12:00:58,553][93247] Initializing env for player 0, init_info: {'port': 40903}... +[2023-09-14 12:00:58,602][93243] Using port 40503 on host... +[2023-09-14 12:00:58,602][93247] Using port 40903 on host... +[2023-09-14 12:00:58,608][93247] Initializing env for player 1, init_info: {'port': 40903}... +[2023-09-14 12:00:58,609][93243] Initializing env for player 1, init_info: {'port': 40503}... +[2023-09-14 12:00:59,382][93222] Initialized w:0 v:3 player:1 +[2023-09-14 12:00:59,382][93222] Initialized w:0 v:3 player:0 +[2023-09-14 12:00:59,384][93222] 2 agent workers initialized for env 0! +[2023-09-14 12:00:59,393][93222] Decorrelating experience for 96 frames... +[2023-09-14 12:00:59,398][93244] Initializing env for player 0, init_info: {'port': 40403}... +[2023-09-14 12:00:59,434][93244] Using port 40403 on host... +[2023-09-14 12:00:59,449][93244] Initializing env for player 1, init_info: {'port': 40403}... +[2023-09-14 12:00:59,638][93243] Initialized w:2 v:3 player:1 +[2023-09-14 12:00:59,638][93243] Initialized w:2 v:3 player:0 +[2023-09-14 12:00:59,639][93243] 2 agent workers initialized for env 2! +[2023-09-14 12:00:59,647][93243] Decorrelating experience for 96 frames... +[2023-09-14 12:00:59,752][93247] Initialized w:6 v:3 player:1 +[2023-09-14 12:00:59,752][93247] Initialized w:6 v:3 player:0 +[2023-09-14 12:00:59,753][93247] 2 agent workers initialized for env 6! +[2023-09-14 12:00:59,763][93247] Decorrelating experience for 96 frames... +[2023-09-14 12:01:00,191][92931] Signal inference workers to stop experience collection... +[2023-09-14 12:01:00,197][93205] InferenceWorker_p0-w0: stopping experience collection +[2023-09-14 12:01:00,588][93244] Initialized w:1 v:3 player:1 +[2023-09-14 12:01:00,589][93244] Initialized w:1 v:3 player:0 +[2023-09-14 12:01:00,591][93244] 2 agent workers initialized for env 1! +[2023-09-14 12:01:00,602][93244] Decorrelating experience for 96 frames... +[2023-09-14 12:01:00,726][97397] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 524288. Throughput: 0: 49.9. Samples: 424. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 12:01:03,220][92931] Signal inference workers to resume experience collection... +[2023-09-14 12:01:03,220][93205] InferenceWorker_p0-w0: resuming experience collection +[2023-09-14 12:01:05,726][97397] Fps is (10 sec: 2457.6, 60 sec: 1821.4, 300 sec: 1821.4). Total num frames: 548864. Throughput: 0: 456.5. Samples: 6160. Policy #0 lag: (min: 0.0, avg: 1.6, max: 4.0) +[2023-09-14 12:01:06,786][93205] Updated weights for policy 0, policy_version 138 (0.0669) +[2023-09-14 12:01:07,944][97397] Heartbeat connected on RolloutWorker_w0 +[2023-09-14 12:01:07,948][97397] Heartbeat connected on RolloutWorker_w1 +[2023-09-14 12:01:07,951][97397] Heartbeat connected on RolloutWorker_w2 +[2023-09-14 12:01:07,953][97397] Heartbeat connected on Batcher_0 +[2023-09-14 12:01:07,955][97397] Heartbeat connected on RolloutWorker_w3 +[2023-09-14 12:01:07,957][97397] Heartbeat connected on LearnerWorker_p0 +[2023-09-14 12:01:07,960][97397] Heartbeat connected on InferenceWorker_p0-w0 +[2023-09-14 12:01:07,968][97397] Heartbeat connected on RolloutWorker_w4 +[2023-09-14 12:01:07,970][97397] Heartbeat connected on RolloutWorker_w5 +[2023-09-14 12:01:07,982][97397] Heartbeat connected on RolloutWorker_w6 +[2023-09-14 12:01:07,996][97397] Heartbeat connected on RolloutWorker_w7 +[2023-09-14 12:01:09,819][93205] Updated weights for policy 0, policy_version 148 (0.0012) +[2023-09-14 12:01:10,726][97397] Fps is (10 sec: 9420.8, 60 sec: 5094.2, 300 sec: 5094.2). Total num frames: 618496. Throughput: 0: 883.8. Samples: 16344. Policy #0 lag: (min: 0.0, avg: 1.1, max: 2.0) +[2023-09-14 12:01:12,673][93205] Updated weights for policy 0, policy_version 158 (0.0014) +[2023-09-14 12:01:15,518][93205] Updated weights for policy 0, policy_version 168 (0.0013) +[2023-09-14 12:01:15,726][97397] Fps is (10 sec: 13926.4, 60 sec: 6974.0, 300 sec: 6974.0). Total num frames: 688128. Throughput: 0: 1612.7. Samples: 37888. Policy #0 lag: (min: 0.0, avg: 1.1, max: 3.0) +[2023-09-14 12:01:18,292][93205] Updated weights for policy 0, policy_version 178 (0.0014) +[2023-09-14 12:01:20,726][97397] Fps is (10 sec: 14336.0, 60 sec: 8337.8, 300 sec: 8337.8). Total num frames: 761856. Throughput: 0: 2097.5. Samples: 59764. Policy #0 lag: (min: 0.0, avg: 1.1, max: 3.0) +[2023-09-14 12:01:20,803][93245] Large shaping reward 2.772 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 2.0), ('DAMAGECOUNT', 1.77, 177.0), ('weapon5', 0.002)] +[2023-09-14 12:01:21,063][93205] Updated weights for policy 0, policy_version 188 (0.0017) +[2023-09-14 12:01:23,844][93205] Updated weights for policy 0, policy_version 198 (0.0013) +[2023-09-14 12:01:25,726][97397] Fps is (10 sec: 14745.6, 60 sec: 9294.3, 300 sec: 9294.3). Total num frames: 835584. Throughput: 0: 2110.3. Samples: 70680. Policy #0 lag: (min: 0.0, avg: 1.0, max: 3.0) +[2023-09-14 12:01:26,691][93205] Updated weights for policy 0, policy_version 208 (0.0013) +[2023-09-14 12:01:29,663][93205] Updated weights for policy 0, policy_version 218 (0.0015) +[2023-09-14 12:01:30,726][97397] Fps is (10 sec: 14336.1, 60 sec: 9896.0, 300 sec: 9896.0). Total num frames: 905216. Throughput: 0: 2391.5. Samples: 92056. Policy #0 lag: (min: 0.0, avg: 1.1, max: 2.0) +[2023-09-14 12:01:32,485][93205] Updated weights for policy 0, policy_version 228 (0.0013) +[2023-09-14 12:01:35,293][93205] Updated weights for policy 0, policy_version 238 (0.0012) +[2023-09-14 12:01:35,726][97397] Fps is (10 sec: 14336.0, 60 sec: 10453.5, 300 sec: 10453.5). Total num frames: 978944. Throughput: 0: 2615.3. Samples: 113748. Policy #0 lag: (min: 0.0, avg: 0.9, max: 2.0) +[2023-09-14 12:01:37,508][92931] Stopping Batcher_0... +[2023-09-14 12:01:37,509][92931] Loop batcher_evt_loop terminating... +[2023-09-14 12:01:37,509][92931] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000246_1007616.pth... +[2023-09-14 12:01:37,515][97397] Component Batcher_0 stopped! +[2023-09-14 12:01:37,534][93205] Weights refcount: 2 0 +[2023-09-14 12:01:37,535][93205] Stopping InferenceWorker_p0-w0... +[2023-09-14 12:01:37,535][93205] Loop inference_proc0-0_evt_loop terminating... +[2023-09-14 12:01:37,535][97397] Component InferenceWorker_p0-w0 stopped! +[2023-09-14 12:01:37,566][92931] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000246_1007616.pth... +[2023-09-14 12:01:37,636][92931] Stopping LearnerWorker_p0... +[2023-09-14 12:01:37,636][92931] Loop learner_proc0_evt_loop terminating... +[2023-09-14 12:01:37,636][97397] Component LearnerWorker_p0 stopped! +[2023-09-14 12:01:38,318][93244] Stopping RolloutWorker_w1... +[2023-09-14 12:01:38,318][93244] Loop rollout_proc1_evt_loop terminating... +[2023-09-14 12:01:38,318][97397] Component RolloutWorker_w1 stopped! +[2023-09-14 12:01:38,319][93249] Stopping RolloutWorker_w7... +[2023-09-14 12:01:38,320][93249] Loop rollout_proc7_evt_loop terminating... +[2023-09-14 12:01:38,320][97397] Component RolloutWorker_w7 stopped! +[2023-09-14 12:01:38,365][93248] Stopping RolloutWorker_w4... +[2023-09-14 12:01:38,366][93248] Loop rollout_proc4_evt_loop terminating... +[2023-09-14 12:01:38,365][97397] Component RolloutWorker_w4 stopped! +[2023-09-14 12:01:38,369][93247] Stopping RolloutWorker_w6... +[2023-09-14 12:01:38,369][93245] Stopping RolloutWorker_w5... +[2023-09-14 12:01:38,370][93247] Loop rollout_proc6_evt_loop terminating... +[2023-09-14 12:01:38,370][93245] Loop rollout_proc5_evt_loop terminating... +[2023-09-14 12:01:38,369][97397] Component RolloutWorker_w6 stopped! +[2023-09-14 12:01:38,370][97397] Component RolloutWorker_w5 stopped! +[2023-09-14 12:01:38,371][93222] Stopping RolloutWorker_w0... +[2023-09-14 12:01:38,371][93222] Loop rollout_proc0_evt_loop terminating... +[2023-09-14 12:01:38,371][97397] Component RolloutWorker_w0 stopped! +[2023-09-14 12:01:38,377][93243] Stopping RolloutWorker_w2... +[2023-09-14 12:01:38,377][97397] Component RolloutWorker_w2 stopped! +[2023-09-14 12:01:38,377][93243] Loop rollout_proc2_evt_loop terminating... +[2023-09-14 12:01:38,379][93246] Stopping RolloutWorker_w3... +[2023-09-14 12:01:38,380][93246] Loop rollout_proc3_evt_loop terminating... +[2023-09-14 12:01:38,379][97397] Component RolloutWorker_w3 stopped! +[2023-09-14 12:01:38,380][97397] Waiting for process learner_proc0 to stop... +[2023-09-14 12:01:38,382][97397] Waiting for process inference_proc0-0 to join... +[2023-09-14 12:01:38,383][97397] Waiting for process rollout_proc0 to join... +[2023-09-14 12:01:38,898][97397] Waiting for process rollout_proc1 to join... +[2023-09-14 12:01:38,900][97397] Waiting for process rollout_proc2 to join... +[2023-09-14 12:01:38,902][97397] Waiting for process rollout_proc3 to join... +[2023-09-14 12:01:38,904][97397] Waiting for process rollout_proc4 to join... +[2023-09-14 12:01:38,905][97397] Waiting for process rollout_proc5 to join... +[2023-09-14 12:01:38,907][97397] Waiting for process rollout_proc6 to join... +[2023-09-14 12:01:38,909][97397] Waiting for process rollout_proc7 to join... +[2023-09-14 12:01:38,910][97397] Batcher 0 profile tree view: +batching: 1.0973, releasing_batches: 0.0041 +[2023-09-14 12:01:38,910][97397] InferenceWorker_p0-w0 profile tree view: +wait_policy: 0.0000 + wait_policy_total: 6.0334 +update_model: 1.0026 + weight_update: 0.0012 +one_step: 0.0044 + handle_policy_step: 32.6111 + deserialize: 0.9388, stack: 0.1084, obs_to_device_normalize: 5.3014, forward: 22.7441, send_messages: 0.8995 + prepare_outputs: 1.8688 + to_cpu: 0.9259 +[2023-09-14 12:01:38,912][97397] Learner 0 profile tree view: +misc: 0.0005, prepare_batch: 3.8245 +train: 9.2829 + epoch_init: 0.0006, minibatch_init: 0.0006, losses_postprocess: 0.0406, kl_divergence: 0.1054, after_optimizer: 0.1577 + calculate_losses: 2.1022 + losses_init: 0.0003, forward_head: 0.3496, bptt_initial: 1.2132, tail: 0.1426, advantages_returns: 0.0144, losses: 0.2471 + bptt: 0.1168 + bptt_forward_core: 0.1123 + update: 6.8274 + clip: 3.3160 +[2023-09-14 12:01:38,912][97397] RolloutWorker_w0 profile tree view: +wait_for_trajectories: 0.0158, enqueue_policy_requests: 0.8028, env_step: 23.0350, overhead: 0.5150, complete_rollouts: 0.0164 +save_policy_outputs: 1.0075 + split_output_tensors: 0.3470 +[2023-09-14 12:01:38,913][97397] RolloutWorker_w7 profile tree view: +wait_for_trajectories: 0.0160, enqueue_policy_requests: 0.8132, env_step: 23.7167, overhead: 0.5256, complete_rollouts: 0.0168 +save_policy_outputs: 1.0105 + split_output_tensors: 0.3476 +[2023-09-14 12:01:38,915][97397] Loop Runner_EvtLoop terminating... +[2023-09-14 12:01:38,916][97397] Runner profile tree view: +main_loop: 50.9484 +[2023-09-14 12:01:38,916][97397] Collected {0: 1007616}, FPS: 9486.6 +[2023-09-14 12:03:16,383][97397] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json +[2023-09-14 12:03:16,385][97397] Overriding arg 'num_workers' with value 1 passed from command line +[2023-09-14 12:03:16,386][97397] Adding new argument 'no_render'=True that is not in the saved config file! +[2023-09-14 12:03:16,386][97397] Adding new argument 'save_video'=True that is not in the saved config file! +[2023-09-14 12:03:16,387][97397] Adding new argument 'video_frames'=1000000000.0 that is not in the saved config file! +[2023-09-14 12:03:16,387][97397] Adding new argument 'video_name'=None that is not in the saved config file! +[2023-09-14 12:03:16,388][97397] Adding new argument 'max_num_frames'=1000000000.0 that is not in the saved config file! +[2023-09-14 12:03:16,389][97397] Adding new argument 'max_num_episodes'=10 that is not in the saved config file! +[2023-09-14 12:03:16,389][97397] Adding new argument 'push_to_hub'=False that is not in the saved config file! +[2023-09-14 12:03:16,390][97397] Adding new argument 'hf_repository'=None that is not in the saved config file! +[2023-09-14 12:03:16,391][97397] Adding new argument 'policy_index'=0 that is not in the saved config file! +[2023-09-14 12:03:16,392][97397] Adding new argument 'eval_deterministic'=False that is not in the saved config file! +[2023-09-14 12:03:16,392][97397] Adding new argument 'train_script'=None that is not in the saved config file! +[2023-09-14 12:03:16,393][97397] Adding new argument 'enjoy_script'=None that is not in the saved config file! +[2023-09-14 12:03:16,394][97397] Using frameskip 1 and render_action_repeat=4 for evaluation +[2023-09-14 12:03:16,397][97397] Multi agent env, num agents: 2 +[2023-09-14 12:03:16,424][97397] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:03:16,428][97397] RunningMeanStd input shape: (23,) +[2023-09-14 12:03:16,429][97397] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:03:16,430][97397] RunningMeanStd input shape: (1,) +[2023-09-14 12:03:16,443][97397] ConvEncoder: input_channels=3 +[2023-09-14 12:03:16,582][97397] Conv encoder output size: 512 +[2023-09-14 12:03:16,585][97397] Policy head output size: 640 +[2023-09-14 12:03:17,532][97397] Loading state from checkpoint /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000246_1007616.pth... +[2023-09-14 12:03:17,565][97397] Port 40300 is available +[2023-09-14 12:03:17,567][97397] Using port 40300 +[2023-09-14 12:03:17,568][97397] Initializing env for player 0, init_info: {'port': 40300}... +[2023-09-14 12:03:17,618][97397] Initializing env for player 1, init_info: {'port': 40300}... +[2023-09-14 12:03:17,668][97397] 2 agent workers initialized for env 0! +[2023-09-14 12:03:17,670][97397] Using port 40300 on host... +[2023-09-14 12:03:18,724][97397] Initialized w:0 v:0 player:0 +[2023-09-14 12:03:18,725][97397] Initialized w:0 v:0 player:1 +[2023-09-14 12:03:19,234][97397] Num frames 100... +[2023-09-14 12:03:19,470][97397] Num frames 200... +[2023-09-14 12:03:19,714][97397] Num frames 300... +[2023-09-14 12:03:19,959][97397] Num frames 400... +[2023-09-14 12:03:20,180][97397] Num frames 500... +[2023-09-14 12:03:20,428][97397] Num frames 600... +[2023-09-14 12:03:20,660][97397] Num frames 700... +[2023-09-14 12:03:20,937][97397] Num frames 800... +[2023-09-14 12:03:21,231][97397] Num frames 900... +[2023-09-14 12:03:21,512][97397] Num frames 1000... +[2023-09-14 12:03:21,784][97397] Num frames 1100... +[2023-09-14 12:03:22,030][97397] Num frames 1200... +[2023-09-14 12:03:22,268][97397] Num frames 1300... +[2023-09-14 12:03:22,512][97397] Num frames 1400... +[2023-09-14 12:03:22,757][97397] Num frames 1500... +[2023-09-14 12:03:22,995][97397] Num frames 1600... +[2023-09-14 12:03:23,221][97397] Num frames 1700... +[2023-09-14 12:03:23,437][97397] Num frames 1800... +[2023-09-14 12:03:23,659][97397] Num frames 1900... +[2023-09-14 12:03:23,896][97397] Num frames 2000... +[2023-09-14 12:03:24,135][97397] Num frames 2100... +[2023-09-14 12:03:24,426][97397] Num frames 2200... +[2023-09-14 12:03:24,679][97397] Num frames 2300... +[2023-09-14 12:03:24,943][97397] Num frames 2400... +[2023-09-14 12:03:25,201][97397] Num frames 2500... +[2023-09-14 12:03:25,501][97397] Num frames 2600... +[2023-09-14 12:03:25,739][97397] Num frames 2700... +[2023-09-14 12:03:25,997][97397] Num frames 2800... +[2023-09-14 12:03:26,227][97397] Num frames 2900... +[2023-09-14 12:03:26,464][97397] Num frames 3000... +[2023-09-14 12:03:26,699][97397] Num frames 3100... +[2023-09-14 12:03:26,942][97397] Num frames 3200... +[2023-09-14 12:03:27,198][97397] Num frames 3300... +[2023-09-14 12:03:27,465][97397] Num frames 3400... +[2023-09-14 12:03:27,710][97397] Num frames 3500... +[2023-09-14 12:03:27,951][97397] Num frames 3600... +[2023-09-14 12:03:28,225][97397] Num frames 3700... +[2023-09-14 12:03:28,516][97397] Num frames 3800... +[2023-09-14 12:03:28,765][97397] Num frames 3900... +[2023-09-14 12:03:29,034][97397] Num frames 4000... +[2023-09-14 12:03:29,303][97397] Num frames 4100... +[2023-09-14 12:03:29,566][97397] Num frames 4200... +[2023-09-14 12:03:29,808][97397] Num frames 4300... +[2023-09-14 12:03:30,057][97397] Num frames 4400... +[2023-09-14 12:03:30,295][97397] Num frames 4500... +[2023-09-14 12:03:30,535][97397] Num frames 4600... +[2023-09-14 12:03:30,782][97397] Num frames 4700... +[2023-09-14 12:03:31,013][97397] Num frames 4800... +[2023-09-14 12:03:31,286][97397] Num frames 4900... +[2023-09-14 12:03:31,539][97397] Num frames 5000... +[2023-09-14 12:03:31,791][97397] Num frames 5100... +[2023-09-14 12:03:32,037][97397] Num frames 5200... +[2023-09-14 12:03:32,298][97397] Num frames 5300... +[2023-09-14 12:03:32,537][97397] Num frames 5400... +[2023-09-14 12:03:32,805][97397] Num frames 5500... +[2023-09-14 12:03:33,061][97397] Num frames 5600... +[2023-09-14 12:03:33,340][97397] Num frames 5700... +[2023-09-14 12:03:33,586][97397] Num frames 5800... +[2023-09-14 12:03:33,817][97397] Num frames 5900... +[2023-09-14 12:03:34,076][97397] Num frames 6000... +[2023-09-14 12:03:34,392][97397] Num frames 6100... +[2023-09-14 12:03:34,637][97397] Num frames 6200... +[2023-09-14 12:03:34,906][97397] Num frames 6300... +[2023-09-14 12:03:35,135][97397] Num frames 6400... +[2023-09-14 12:03:35,393][97397] Num frames 6500... +[2023-09-14 12:03:35,640][97397] Num frames 6600... +[2023-09-14 12:03:35,896][97397] Num frames 6700... +[2023-09-14 12:03:36,136][97397] Num frames 6800... +[2023-09-14 12:03:36,355][97397] Num frames 6900... +[2023-09-14 12:03:36,596][97397] Num frames 7000... +[2023-09-14 12:03:36,863][97397] Num frames 7100... +[2023-09-14 12:03:37,149][97397] Num frames 7200... +[2023-09-14 12:03:37,424][97397] Num frames 7300... +[2023-09-14 12:03:37,691][97397] Num frames 7400... +[2023-09-14 12:03:37,951][97397] Num frames 7500... +[2023-09-14 12:03:38,265][97397] Num frames 7600... +[2023-09-14 12:03:38,525][97397] Num frames 7700... +[2023-09-14 12:03:38,763][97397] Num frames 7800... +[2023-09-14 12:03:38,998][97397] Num frames 7900... +[2023-09-14 12:03:39,260][97397] Num frames 8000... +[2023-09-14 12:03:39,544][97397] Num frames 8100... +[2023-09-14 12:03:39,816][97397] Num frames 8200... +[2023-09-14 12:03:40,090][97397] Num frames 8300... +[2023-09-14 12:03:40,347][97397] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:03:40,347][97397] DAMAGECOUNT value on done: 12.0 +[2023-09-14 12:03:40,349][97397] Sum rewards: 14.318, reward structure: {'HEALTH': '-1.120', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.003', 'AMMO2': '0.014', 'AMMO3': '0.040', 'AMMO4': '0.069', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.400', 'weapon5': '0.574', 'weapon4': '0.602', 'weapon2': '1.536', 'weapon3': '13.002'} +[2023-09-14 12:03:40,416][97397] Avg episode rewards: #0: 10.216, #1: 14.318, true rewards: #0: 1.000, #1: 0.000 +[2023-09-14 12:03:40,418][97397] Avg episode reward: 12.267, avg true_objective: 0.500 +[2023-09-14 12:03:40,425][97397] Num frames 8400... +[2023-09-14 12:03:40,697][97397] Num frames 8500... +[2023-09-14 12:03:40,965][97397] Num frames 8600... +[2023-09-14 12:03:41,246][97397] Num frames 8700... +[2023-09-14 12:03:41,492][97397] Num frames 8800... +[2023-09-14 12:03:41,750][97397] Num frames 8900... +[2023-09-14 12:03:41,980][97397] Num frames 9000... +[2023-09-14 12:03:42,252][97397] Num frames 9100... +[2023-09-14 12:03:42,507][97397] Num frames 9200... +[2023-09-14 12:03:42,768][97397] Num frames 9300... +[2023-09-14 12:03:43,083][97397] Num frames 9400... +[2023-09-14 12:03:43,342][97397] Num frames 9500... +[2023-09-14 12:03:43,577][97397] Num frames 9600... +[2023-09-14 12:03:43,847][97397] Num frames 9700... +[2023-09-14 12:03:44,132][97397] Num frames 9800... +[2023-09-14 12:03:44,614][97397] Num frames 9900... +[2023-09-14 12:03:44,935][97397] Num frames 10000... +[2023-09-14 12:03:45,280][97397] Num frames 10100... +[2023-09-14 12:03:45,680][97397] Num frames 10200... +[2023-09-14 12:03:45,980][97397] Num frames 10300... +[2023-09-14 12:03:46,271][97397] Num frames 10400... +[2023-09-14 12:03:46,586][97397] Num frames 10500... +[2023-09-14 12:03:47,011][97397] Num frames 10600... +[2023-09-14 12:03:47,368][97397] Num frames 10700... +[2023-09-14 12:03:47,759][97397] Num frames 10800... +[2023-09-14 12:03:48,043][97397] Num frames 10900... +[2023-09-14 12:03:48,392][97397] Num frames 11000... +[2023-09-14 12:03:48,754][97397] Num frames 11100... +[2023-09-14 12:03:49,028][97397] Num frames 11200... +[2023-09-14 12:03:49,362][97397] Num frames 11300... +[2023-09-14 12:03:49,662][97397] Num frames 11400... +[2023-09-14 12:03:49,936][97397] Num frames 11500... +[2023-09-14 12:03:50,173][97397] Num frames 11600... +[2023-09-14 12:03:50,426][97397] Num frames 11700... +[2023-09-14 12:03:50,689][97397] Num frames 11800... +[2023-09-14 12:03:51,025][97397] Num frames 11900... +[2023-09-14 12:03:51,312][97397] Num frames 12000... +[2023-09-14 12:03:51,569][97397] Num frames 12100... +[2023-09-14 12:03:51,833][97397] Num frames 12200... +[2023-09-14 12:03:52,066][97397] Num frames 12300... +[2023-09-14 12:03:52,306][97397] Num frames 12400... +[2023-09-14 12:03:52,541][97397] Num frames 12500... +[2023-09-14 12:03:52,842][97397] Num frames 12600... +[2023-09-14 12:03:53,109][97397] Num frames 12700... +[2023-09-14 12:03:53,358][97397] Num frames 12800... +[2023-09-14 12:03:53,661][97397] Num frames 12900... +[2023-09-14 12:03:53,950][97397] Num frames 13000... +[2023-09-14 12:03:54,218][97397] Num frames 13100... +[2023-09-14 12:03:54,507][97397] Num frames 13200... +[2023-09-14 12:03:54,814][97397] Num frames 13300... +[2023-09-14 12:03:55,075][97397] Num frames 13400... +[2023-09-14 12:03:55,346][97397] Num frames 13500... +[2023-09-14 12:03:55,638][97397] Num frames 13600... +[2023-09-14 12:03:55,960][97397] Num frames 13700... +[2023-09-14 12:03:56,267][97397] Num frames 13800... +[2023-09-14 12:03:56,540][97397] Num frames 13900... +[2023-09-14 12:03:56,852][97397] Num frames 14000... +[2023-09-14 12:03:57,123][97397] Num frames 14100... +[2023-09-14 12:03:57,382][97397] Num frames 14200... +[2023-09-14 12:03:57,680][97397] Num frames 14300... +[2023-09-14 12:03:57,960][97397] Num frames 14400... +[2023-09-14 12:03:58,234][97397] Num frames 14500... +[2023-09-14 12:03:58,529][97397] Num frames 14600... +[2023-09-14 12:03:58,825][97397] Num frames 14700... +[2023-09-14 12:03:59,128][97397] Num frames 14800... +[2023-09-14 12:03:59,445][97397] Num frames 14900... +[2023-09-14 12:03:59,717][97397] Num frames 15000... +[2023-09-14 12:03:59,982][97397] Num frames 15100... +[2023-09-14 12:04:00,232][97397] Num frames 15200... +[2023-09-14 12:04:00,507][97397] Num frames 15300... +[2023-09-14 12:04:00,764][97397] Num frames 15400... +[2023-09-14 12:04:01,001][97397] Num frames 15500... +[2023-09-14 12:04:01,293][97397] Num frames 15600... +[2023-09-14 12:04:01,557][97397] Num frames 15700... +[2023-09-14 12:04:01,944][97397] Num frames 15800... +[2023-09-14 12:04:02,232][97397] Num frames 15900... +[2023-09-14 12:04:02,472][97397] Num frames 16000... +[2023-09-14 12:04:02,712][97397] Num frames 16100... +[2023-09-14 12:04:02,938][97397] Num frames 16200... +[2023-09-14 12:04:03,185][97397] Num frames 16300... +[2023-09-14 12:04:03,427][97397] Num frames 16400... +[2023-09-14 12:04:03,697][97397] Num frames 16500... +[2023-09-14 12:04:03,945][97397] Num frames 16600... +[2023-09-14 12:04:04,170][97397] Num frames 16700... +[2023-09-14 12:04:04,458][97397] DAMAGECOUNT value on done: 45.0 +[2023-09-14 12:04:04,458][97397] DAMAGECOUNT value on done: 37.0 +[2023-09-14 12:04:04,460][97397] Sum rewards: 14.910, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.025', 'AMMO3': '0.040', 'AMMO4': '0.123', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.450', 'weapon5': '0.666', 'weapon2': '0.872', 'weapon4': '1.078', 'weapon3': '12.950'} +[2023-09-14 12:04:04,523][97397] Avg episode rewards: #0: 11.004, #1: 14.613, true rewards: #0: 1.000, #1: 0.000 +[2023-09-14 12:04:04,524][97397] Avg episode reward: 12.809, avg true_objective: 0.500 +[2023-09-14 12:04:04,537][97397] Num frames 16800... +[2023-09-14 12:04:04,881][97397] Num frames 16900... +[2023-09-14 12:04:05,221][97397] Num frames 17000... +[2023-09-14 12:04:05,516][97397] Num frames 17100... +[2023-09-14 12:04:05,777][97397] Num frames 17200... +[2023-09-14 12:04:06,013][97397] Num frames 17300... +[2023-09-14 12:04:06,260][97397] Num frames 17400... +[2023-09-14 12:04:06,504][97397] Num frames 17500... +[2023-09-14 12:04:06,754][97397] Num frames 17600... +[2023-09-14 12:04:07,073][97397] Num frames 17700... +[2023-09-14 12:04:07,350][97397] Num frames 17800... +[2023-09-14 12:04:07,602][97397] Num frames 17900... +[2023-09-14 12:04:07,903][97397] Num frames 18000... +[2023-09-14 12:04:08,237][97397] Num frames 18100... +[2023-09-14 12:04:08,546][97397] Num frames 18200... +[2023-09-14 12:04:08,776][97397] Num frames 18300... +[2023-09-14 12:04:09,022][97397] Num frames 18400... +[2023-09-14 12:04:09,275][97397] Num frames 18500... +[2023-09-14 12:04:09,543][97397] Num frames 18600... +[2023-09-14 12:04:09,797][97397] Num frames 18700... +[2023-09-14 12:04:10,062][97397] Num frames 18800... +[2023-09-14 12:04:10,307][97397] Num frames 18900... +[2023-09-14 12:04:10,568][97397] Num frames 19000... +[2023-09-14 12:04:10,864][97397] Num frames 19100... +[2023-09-14 12:04:11,098][97397] Num frames 19200... +[2023-09-14 12:04:11,396][97397] Num frames 19300... +[2023-09-14 12:04:11,632][97397] Num frames 19400... +[2023-09-14 12:04:11,889][97397] Num frames 19500... +[2023-09-14 12:04:12,112][97397] Num frames 19600... +[2023-09-14 12:04:12,361][97397] Num frames 19700... +[2023-09-14 12:04:12,616][97397] Num frames 19800... +[2023-09-14 12:04:12,868][97397] Num frames 19900... +[2023-09-14 12:04:13,164][97397] Num frames 20000... +[2023-09-14 12:04:13,401][97397] Num frames 20100... +[2023-09-14 12:04:13,650][97397] Num frames 20200... +[2023-09-14 12:04:13,878][97397] Num frames 20300... +[2023-09-14 12:04:14,130][97397] Num frames 20400... +[2023-09-14 12:04:14,401][97397] Num frames 20500... +[2023-09-14 12:04:14,646][97397] Num frames 20600... +[2023-09-14 12:04:14,916][97397] Num frames 20700... +[2023-09-14 12:04:15,199][97397] Num frames 20800... +[2023-09-14 12:04:15,466][97397] Num frames 20900... +[2023-09-14 12:04:15,720][97397] Num frames 21000... +[2023-09-14 12:04:15,953][97397] Num frames 21100... +[2023-09-14 12:04:16,210][97397] Num frames 21200... +[2023-09-14 12:04:16,473][97397] Num frames 21300... +[2023-09-14 12:04:16,712][97397] Num frames 21400... +[2023-09-14 12:04:16,936][97397] Num frames 21500... +[2023-09-14 12:04:17,181][97397] Num frames 21600... +[2023-09-14 12:04:17,431][97397] Num frames 21700... +[2023-09-14 12:04:17,711][97397] Num frames 21800... +[2023-09-14 12:04:17,973][97397] Num frames 21900... +[2023-09-14 12:04:18,290][97397] Num frames 22000... +[2023-09-14 12:04:18,536][97397] Num frames 22100... +[2023-09-14 12:04:18,792][97397] Num frames 22200... +[2023-09-14 12:04:19,032][97397] Num frames 22300... +[2023-09-14 12:04:19,304][97397] Num frames 22400... +[2023-09-14 12:04:19,551][97397] Num frames 22500... +[2023-09-14 12:04:19,780][97397] Num frames 22600... +[2023-09-14 12:04:20,016][97397] Num frames 22700... +[2023-09-14 12:04:20,259][97397] Num frames 22800... +[2023-09-14 12:04:20,493][97397] Num frames 22900... +[2023-09-14 12:04:20,774][97397] Num frames 23000... +[2023-09-14 12:04:21,015][97397] Num frames 23100... +[2023-09-14 12:04:21,284][97397] Num frames 23200... +[2023-09-14 12:04:21,520][97397] Num frames 23300... +[2023-09-14 12:04:21,777][97397] Num frames 23400... +[2023-09-14 12:04:22,013][97397] Num frames 23500... +[2023-09-14 12:04:22,246][97397] Num frames 23600... +[2023-09-14 12:04:22,481][97397] Num frames 23700... +[2023-09-14 12:04:22,716][97397] Num frames 23800... +[2023-09-14 12:04:22,938][97397] Num frames 23900... +[2023-09-14 12:04:23,165][97397] Num frames 24000... +[2023-09-14 12:04:23,417][97397] Num frames 24100... +[2023-09-14 12:04:23,651][97397] Num frames 24200... +[2023-09-14 12:04:23,888][97397] Num frames 24300... +[2023-09-14 12:04:24,136][97397] Num frames 24400... +[2023-09-14 12:04:24,426][97397] Num frames 24500... +[2023-09-14 12:04:24,698][97397] Num frames 24600... +[2023-09-14 12:04:24,977][97397] Num frames 24700... +[2023-09-14 12:04:25,257][97397] Num frames 24800... +[2023-09-14 12:04:25,561][97397] Num frames 24900... +[2023-09-14 12:04:25,820][97397] Num frames 25000... +[2023-09-14 12:04:26,061][97397] Num frames 25100... +[2023-09-14 12:04:26,287][97397] DAMAGECOUNT value on done: 57.0 +[2023-09-14 12:04:26,287][97397] DAMAGECOUNT value on done: 92.0 +[2023-09-14 12:04:26,289][97397] Sum rewards: 9.675, reward structure: {'HEALTH': '-1.470', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon5': '0.194', 'WEAPON3': '0.200', 'DAMAGECOUNT': '0.200', 'FRAGCOUNT': '0.999', 'weapon4': '1.842', 'weapon3': '3.908', 'weapon2': '4.548'} +[2023-09-14 12:04:26,349][97397] Avg episode rewards: #0: 10.561, #1: 14.175, true rewards: #0: 0.667, #1: 0.000 +[2023-09-14 12:04:26,350][97397] Avg episode reward: 12.368, avg true_objective: 0.333 +[2023-09-14 12:04:26,366][97397] Num frames 25200... +[2023-09-14 12:04:26,632][97397] Num frames 25300... +[2023-09-14 12:04:26,901][97397] Num frames 25400... +[2023-09-14 12:04:27,185][97397] Num frames 25500... +[2023-09-14 12:04:27,438][97397] Num frames 25600... +[2023-09-14 12:04:27,679][97397] Num frames 25700... +[2023-09-14 12:04:27,927][97397] Num frames 25800... +[2023-09-14 12:04:28,205][97397] Num frames 25900... +[2023-09-14 12:04:28,498][97397] Num frames 26000... +[2023-09-14 12:04:28,782][97397] Num frames 26100... +[2023-09-14 12:04:29,072][97397] Num frames 26200... +[2023-09-14 12:04:29,342][97397] Num frames 26300... +[2023-09-14 12:04:29,583][97397] Num frames 26400... +[2023-09-14 12:04:29,847][97397] Num frames 26500... +[2023-09-14 12:04:30,142][97397] Num frames 26600... +[2023-09-14 12:04:30,414][97397] Num frames 26700... +[2023-09-14 12:04:30,661][97397] Num frames 26800... +[2023-09-14 12:04:30,920][97397] Num frames 26900... +[2023-09-14 12:04:31,202][97397] Num frames 27000... +[2023-09-14 12:04:31,434][97397] Num frames 27100... +[2023-09-14 12:04:31,674][97397] Num frames 27200... +[2023-09-14 12:04:31,932][97397] Num frames 27300... +[2023-09-14 12:04:32,167][97397] Num frames 27400... +[2023-09-14 12:04:32,386][97397] Num frames 27500... +[2023-09-14 12:04:32,608][97397] Num frames 27600... +[2023-09-14 12:04:32,825][97397] Num frames 27700... +[2023-09-14 12:04:33,072][97397] Num frames 27800... +[2023-09-14 12:04:33,312][97397] Num frames 27900... +[2023-09-14 12:04:33,547][97397] Num frames 28000... +[2023-09-14 12:04:33,792][97397] Num frames 28100... +[2023-09-14 12:04:34,030][97397] Num frames 28200... +[2023-09-14 12:04:34,284][97397] Num frames 28300... +[2023-09-14 12:04:34,553][97397] Num frames 28400... +[2023-09-14 12:04:34,800][97397] Num frames 28500... +[2023-09-14 12:04:35,057][97397] Num frames 28600... +[2023-09-14 12:04:35,314][97397] Num frames 28700... +[2023-09-14 12:04:35,562][97397] Num frames 28800... +[2023-09-14 12:04:35,795][97397] Num frames 28900... +[2023-09-14 12:04:36,036][97397] Num frames 29000... +[2023-09-14 12:04:36,266][97397] Num frames 29100... +[2023-09-14 12:04:36,503][97397] Num frames 29200... +[2023-09-14 12:04:36,746][97397] Num frames 29300... +[2023-09-14 12:04:36,998][97397] Num frames 29400... +[2023-09-14 12:04:37,247][97397] Num frames 29500... +[2023-09-14 12:04:37,505][97397] Num frames 29600... +[2023-09-14 12:04:37,756][97397] Num frames 29700... +[2023-09-14 12:04:38,028][97397] Num frames 29800... +[2023-09-14 12:04:38,291][97397] Num frames 29900... +[2023-09-14 12:04:38,536][97397] Num frames 30000... +[2023-09-14 12:04:38,793][97397] Num frames 30100... +[2023-09-14 12:04:39,048][97397] Num frames 30200... +[2023-09-14 12:04:39,301][97397] Num frames 30300... +[2023-09-14 12:04:39,549][97397] Num frames 30400... +[2023-09-14 12:04:39,782][97397] Num frames 30500... +[2023-09-14 12:04:40,014][97397] Num frames 30600... +[2023-09-14 12:04:40,252][97397] Num frames 30700... +[2023-09-14 12:04:40,496][97397] Num frames 30800... +[2023-09-14 12:04:40,722][97397] Num frames 30900... +[2023-09-14 12:04:40,973][97397] Num frames 31000... +[2023-09-14 12:04:41,282][97397] Num frames 31100... +[2023-09-14 12:04:41,538][97397] Num frames 31200... +[2023-09-14 12:04:41,780][97397] Num frames 31300... +[2023-09-14 12:04:42,016][97397] Num frames 31400... +[2023-09-14 12:04:42,248][97397] Num frames 31500... +[2023-09-14 12:04:42,486][97397] Num frames 31600... +[2023-09-14 12:04:42,725][97397] Num frames 31700... +[2023-09-14 12:04:42,998][97397] Num frames 31800... +[2023-09-14 12:04:43,261][97397] Num frames 31900... +[2023-09-14 12:04:43,498][97397] Num frames 32000... +[2023-09-14 12:04:43,801][97397] Num frames 32100... +[2023-09-14 12:04:44,104][97397] Num frames 32200... +[2023-09-14 12:04:44,403][97397] Num frames 32300... +[2023-09-14 12:04:44,690][97397] Num frames 32400... +[2023-09-14 12:04:44,949][97397] Num frames 32500... +[2023-09-14 12:04:45,237][97397] Num frames 32600... +[2023-09-14 12:04:45,499][97397] Num frames 32700... +[2023-09-14 12:04:45,739][97397] Num frames 32800... +[2023-09-14 12:04:45,990][97397] Num frames 32900... +[2023-09-14 12:04:46,252][97397] Num frames 33000... +[2023-09-14 12:04:46,510][97397] Num frames 33100... +[2023-09-14 12:04:46,742][97397] Num frames 33200... +[2023-09-14 12:04:47,033][97397] Num frames 33300... +[2023-09-14 12:04:47,284][97397] Num frames 33400... +[2023-09-14 12:04:47,556][97397] Num frames 33500... +[2023-09-14 12:04:47,799][97397] DAMAGECOUNT value on done: 342.0 +[2023-09-14 12:04:47,800][97397] DAMAGECOUNT value on done: 107.0 +[2023-09-14 12:04:47,801][97397] Sum rewards: 19.276, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.011', 'AMMO3': '0.040', 'AMMO4': '0.056', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.374', 'WEAPON3': '0.400', 'weapon4': '1.230', 'weapon2': '1.394', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.850', 'weapon3': '12.764'} +[2023-09-14 12:04:47,863][97397] Avg episode rewards: #0: 12.740, #1: 12.316, true rewards: #0: 0.750, #1: 0.000 +[2023-09-14 12:04:47,865][97397] Avg episode reward: 12.528, avg true_objective: 0.375 +[2023-09-14 12:04:47,884][97397] Num frames 33600... +[2023-09-14 12:04:48,124][97397] Num frames 33700... +[2023-09-14 12:04:48,385][97397] Num frames 33800... +[2023-09-14 12:04:48,615][97397] Num frames 33900... +[2023-09-14 12:04:48,862][97397] Num frames 34000... +[2023-09-14 12:04:49,148][97397] Num frames 34100... +[2023-09-14 12:04:49,425][97397] Num frames 34200... +[2023-09-14 12:04:49,708][97397] Num frames 34300... +[2023-09-14 12:04:49,987][97397] Num frames 34400... +[2023-09-14 12:04:50,243][97397] Num frames 34500... +[2023-09-14 12:04:50,486][97397] Num frames 34600... +[2023-09-14 12:04:50,725][97397] Num frames 34700... +[2023-09-14 12:04:50,991][97397] Num frames 34800... +[2023-09-14 12:04:51,270][97397] Num frames 34900... +[2023-09-14 12:04:51,520][97397] Num frames 35000... +[2023-09-14 12:04:51,790][97397] Num frames 35100... +[2023-09-14 12:04:52,028][97397] Num frames 35200... +[2023-09-14 12:04:52,275][97397] Num frames 35300... +[2023-09-14 12:04:52,520][97397] Num frames 35400... +[2023-09-14 12:04:52,760][97397] Num frames 35500... +[2023-09-14 12:04:52,998][97397] Num frames 35600... +[2023-09-14 12:04:53,236][97397] Num frames 35700... +[2023-09-14 12:04:53,470][97397] Num frames 35800... +[2023-09-14 12:04:53,703][97397] Num frames 35900... +[2023-09-14 12:04:53,944][97397] Num frames 36000... +[2023-09-14 12:04:54,174][97397] Num frames 36100... +[2023-09-14 12:04:54,436][97397] Num frames 36200... +[2023-09-14 12:04:54,682][97397] Num frames 36300... +[2023-09-14 12:04:54,947][97397] Num frames 36400... +[2023-09-14 12:04:55,210][97397] Num frames 36500... +[2023-09-14 12:04:55,472][97397] Num frames 36600... +[2023-09-14 12:04:55,704][97397] Num frames 36700... +[2023-09-14 12:04:55,952][97397] Num frames 36800... +[2023-09-14 12:04:56,178][97397] Num frames 36900... +[2023-09-14 12:04:56,405][97397] Num frames 37000... +[2023-09-14 12:04:56,635][97397] Num frames 37100... +[2023-09-14 12:04:56,856][97397] Num frames 37200... +[2023-09-14 12:04:57,121][97397] Num frames 37300... +[2023-09-14 12:04:57,391][97397] Num frames 37400... +[2023-09-14 12:04:57,621][97397] Num frames 37500... +[2023-09-14 12:04:57,859][97397] Num frames 37600... +[2023-09-14 12:04:58,130][97397] Num frames 37700... +[2023-09-14 12:04:58,382][97397] Num frames 37800... +[2023-09-14 12:04:58,604][97397] Num frames 37900... +[2023-09-14 12:04:58,870][97397] Num frames 38000... +[2023-09-14 12:04:59,131][97397] Num frames 38100... +[2023-09-14 12:04:59,383][97397] Num frames 38200... +[2023-09-14 12:04:59,626][97397] Num frames 38300... +[2023-09-14 12:04:59,862][97397] Num frames 38400... +[2023-09-14 12:05:00,101][97397] Num frames 38500... +[2023-09-14 12:05:00,343][97397] Num frames 38600... +[2023-09-14 12:05:00,567][97397] Num frames 38700... +[2023-09-14 12:05:00,801][97397] Num frames 38800... +[2023-09-14 12:05:01,050][97397] Num frames 38900... +[2023-09-14 12:05:01,337][97397] Num frames 39000... +[2023-09-14 12:05:01,608][97397] Num frames 39100... +[2023-09-14 12:05:01,865][97397] Num frames 39200... +[2023-09-14 12:05:02,116][97397] Num frames 39300... +[2023-09-14 12:05:02,357][97397] Num frames 39400... +[2023-09-14 12:05:02,605][97397] Num frames 39500... +[2023-09-14 12:05:02,832][97397] Num frames 39600... +[2023-09-14 12:05:03,081][97397] Num frames 39700... +[2023-09-14 12:05:03,342][97397] Num frames 39800... +[2023-09-14 12:05:03,623][97397] Num frames 39900... +[2023-09-14 12:05:03,923][97397] Num frames 40000... +[2023-09-14 12:05:04,190][97397] Num frames 40100... +[2023-09-14 12:05:04,551][97397] Num frames 40200... +[2023-09-14 12:05:04,831][97397] Num frames 40300... +[2023-09-14 12:05:05,082][97397] Num frames 40400... +[2023-09-14 12:05:05,341][97397] Num frames 40500... +[2023-09-14 12:05:05,629][97397] Num frames 40600... +[2023-09-14 12:05:05,874][97397] Num frames 40700... +[2023-09-14 12:05:06,146][97397] Num frames 40800... +[2023-09-14 12:05:06,386][97397] Num frames 40900... +[2023-09-14 12:05:06,633][97397] Num frames 41000... +[2023-09-14 12:05:06,869][97397] Num frames 41100... +[2023-09-14 12:05:07,142][97397] Num frames 41200... +[2023-09-14 12:05:07,416][97397] Num frames 41300... +[2023-09-14 12:05:07,719][97397] Num frames 41400... +[2023-09-14 12:05:07,962][97397] Num frames 41500... +[2023-09-14 12:05:08,222][97397] Num frames 41600... +[2023-09-14 12:05:08,472][97397] Num frames 41700... +[2023-09-14 12:05:08,727][97397] Num frames 41800... +[2023-09-14 12:05:08,963][97397] Num frames 41900... +[2023-09-14 12:05:09,207][97397] DAMAGECOUNT value on done: 442.0 +[2023-09-14 12:05:09,207][97397] DAMAGECOUNT value on done: 282.0 +[2023-09-14 12:05:09,208][97397] Sum rewards: 12.061, reward structure: {'HEALTH': '-2.400', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.004', 'AMMO4': '0.020', 'AMMO3': '0.050', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.400', 'weapon5': '0.556', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon4': '1.958', 'weapon2': '2.464', 'weapon3': '8.806'} +[2023-09-14 12:05:09,209][97397] Sum rewards: 11.181, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO4': '0.025', 'AMMO3': '0.037', 'WEAPON4': '0.100', 'WEAPON3': '0.300', 'weapon4': '0.702', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.750', 'weapon2': '3.640', 'weapon3': '5.622'} +[2023-09-14 12:05:09,273][97397] Avg episode rewards: #0: 12.604, #1: 12.089, true rewards: #0: 0.600, #1: 0.200 +[2023-09-14 12:05:09,275][97397] Avg episode reward: 12.346, avg true_objective: 0.400 +[2023-09-14 12:06:30,025][109198] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json... +[2023-09-14 12:06:30,143][109198] Rollout worker 0 uses device cpu +[2023-09-14 12:06:30,145][109198] Rollout worker 1 uses device cpu +[2023-09-14 12:06:30,146][109198] Rollout worker 2 uses device cpu +[2023-09-14 12:06:30,147][109198] Rollout worker 3 uses device cpu +[2023-09-14 12:06:30,150][109198] Rollout worker 4 uses device cpu +[2023-09-14 12:06:30,151][109198] Rollout worker 5 uses device cpu +[2023-09-14 12:06:30,153][109198] Rollout worker 6 uses device cpu +[2023-09-14 12:06:30,154][109198] Rollout worker 7 uses device cpu +[2023-09-14 12:06:30,236][109198] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:06:30,237][109198] InferenceWorker_p0-w0: min num requests: 2 +[2023-09-14 12:06:30,263][109198] Starting all processes... +[2023-09-14 12:06:30,265][109198] Starting process learner_proc0 +[2023-09-14 12:06:31,849][109198] Starting all processes... +[2023-09-14 12:06:31,850][112382] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:06:31,851][112382] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 +[2023-09-14 12:06:31,857][109198] Starting process inference_proc0-0 +[2023-09-14 12:06:31,858][109198] Starting process rollout_proc0 +[2023-09-14 12:06:31,858][109198] Starting process rollout_proc1 +[2023-09-14 12:06:31,859][109198] Starting process rollout_proc2 +[2023-09-14 12:06:31,860][109198] Starting process rollout_proc3 +[2023-09-14 12:06:31,860][109198] Starting process rollout_proc4 +[2023-09-14 12:06:31,864][109198] Starting process rollout_proc5 +[2023-09-14 12:06:31,890][112382] Num visible devices: 1 +[2023-09-14 12:06:31,869][109198] Starting process rollout_proc6 +[2023-09-14 12:06:31,871][109198] Starting process rollout_proc7 +[2023-09-14 12:06:31,929][112382] Starting seed is not provided +[2023-09-14 12:06:31,929][112382] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:06:31,930][112382] Initializing actor-critic model on device cuda:0 +[2023-09-14 12:06:31,930][112382] RunningMeanStd input shape: (23,) +[2023-09-14 12:06:31,931][112382] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:06:31,931][112382] RunningMeanStd input shape: (1,) +[2023-09-14 12:06:31,950][112382] ConvEncoder: input_channels=3 +[2023-09-14 12:06:32,132][112382] Conv encoder output size: 512 +[2023-09-14 12:06:32,133][112382] Policy head output size: 640 +[2023-09-14 12:06:32,150][112382] Created Actor Critic model with architecture: +[2023-09-14 12:06:32,151][112382] ActorCriticSharedWeights( + (obs_normalizer): ObservationNormalizer( + (running_mean_std): RunningMeanStdDictInPlace( + (running_mean_std): ModuleDict( + (measurements): RunningMeanStdInPlace() + (obs): RunningMeanStdInPlace() + ) + ) + ) + (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) + (encoder): VizdoomEncoder( + (basic_encoder): ConvEncoder( + (enc): RecursiveScriptModule( + original_name=ConvEncoderImpl + (conv_head): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Conv2d) + (1): RecursiveScriptModule(original_name=ELU) + (2): RecursiveScriptModule(original_name=Conv2d) + (3): RecursiveScriptModule(original_name=ELU) + (4): RecursiveScriptModule(original_name=Conv2d) + (5): RecursiveScriptModule(original_name=ELU) + ) + (mlp_layers): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Linear) + (1): RecursiveScriptModule(original_name=ELU) + ) + ) + ) + (measurements_head): Sequential( + (0): Linear(in_features=23, out_features=128, bias=True) + (1): ELU(alpha=1.0) + (2): Linear(in_features=128, out_features=128, bias=True) + (3): ELU(alpha=1.0) + ) + ) + (core): ModelCoreRNN( + (core): GRU(640, 512) + ) + (decoder): MlpDecoder( + (mlp): Identity() + ) + (critic_linear): Linear(in_features=512, out_features=1, bias=True) + (action_parameterization): ActionParameterizationDefault( + (distribution_linear): Linear(in_features=512, out_features=41, bias=True) + ) +) +[2023-09-14 12:06:33,249][112382] Using optimizer +[2023-09-14 12:06:33,249][112382] Loading state from checkpoint /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000246_1007616.pth... +[2023-09-14 12:06:33,278][112382] Loading model from checkpoint +[2023-09-14 12:06:33,283][112382] Loaded experiment state at self.train_step=246, self.env_steps=1007616 +[2023-09-14 12:06:33,283][112382] Initialized policy 0 weights for model version 246 +[2023-09-14 12:06:33,285][112382] LearnerWorker_p0 finished initialization! +[2023-09-14 12:06:33,285][112382] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:06:33,623][112529] Worker 0 uses CPU cores [0, 1, 2, 3] +[2023-09-14 12:06:33,810][112541] Worker 6 uses CPU cores [24, 25, 26, 27] +[2023-09-14 12:06:33,828][112539] Worker 3 uses CPU cores [12, 13, 14, 15] +[2023-09-14 12:06:33,831][112530] Worker 1 uses CPU cores [4, 5, 6, 7] +[2023-09-14 12:06:33,843][112540] Worker 5 uses CPU cores [20, 21, 22, 23] +[2023-09-14 12:06:33,919][112536] Worker 2 uses CPU cores [8, 9, 10, 11] +[2023-09-14 12:06:34,066][112519] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:06:34,066][112519] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 +[2023-09-14 12:06:34,084][112519] Num visible devices: 1 +[2023-09-14 12:06:34,225][112573] Worker 7 uses CPU cores [28, 29, 30, 31] +[2023-09-14 12:06:34,435][112538] Worker 4 uses CPU cores [16, 17, 18, 19] +[2023-09-14 12:06:34,719][112519] RunningMeanStd input shape: (23,) +[2023-09-14 12:06:34,720][112519] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:06:34,720][112519] RunningMeanStd input shape: (1,) +[2023-09-14 12:06:34,732][112519] ConvEncoder: input_channels=3 +[2023-09-14 12:06:34,840][112519] Conv encoder output size: 512 +[2023-09-14 12:06:34,841][112519] Policy head output size: 640 +[2023-09-14 12:06:35,131][109198] Inference worker 0-0 is ready! +[2023-09-14 12:06:35,132][109198] All inference workers are ready! Signal rollout workers to start! +[2023-09-14 12:06:35,136][112540] Multi agent env, num agents: 2 +[2023-09-14 12:06:35,136][112530] Multi agent env, num agents: 2 +[2023-09-14 12:06:35,136][112538] Multi agent env, num agents: 2 +[2023-09-14 12:06:35,136][112541] Multi agent env, num agents: 2 +[2023-09-14 12:06:35,136][112536] Multi agent env, num agents: 2 +[2023-09-14 12:06:35,138][112539] Multi agent env, num agents: 2 +[2023-09-14 12:06:35,139][112529] Multi agent env, num agents: 2 +[2023-09-14 12:06:35,140][112573] Multi agent env, num agents: 2 +[2023-09-14 12:06:35,173][112539] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:06:35,174][112529] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:06:35,175][112573] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:06:35,176][112539] Multi agent env, num agents: 2 +[2023-09-14 12:06:35,177][112529] Multi agent env, num agents: 2 +[2023-09-14 12:06:35,178][112573] Multi agent env, num agents: 2 +[2023-09-14 12:06:35,183][112530] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:06:35,183][112538] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:06:35,183][112540] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:06:35,186][112541] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:06:35,186][112536] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:06:35,187][112530] Multi agent env, num agents: 2 +[2023-09-14 12:06:35,187][112538] Multi agent env, num agents: 2 +[2023-09-14 12:06:35,187][112540] Multi agent env, num agents: 2 +[2023-09-14 12:06:35,190][112541] Multi agent env, num agents: 2 +[2023-09-14 12:06:35,190][112536] Multi agent env, num agents: 2 +[2023-09-14 12:06:35,207][112529] Port 40300 is available +[2023-09-14 12:06:35,207][112529] Using port 40300 +[2023-09-14 12:06:35,208][112573] UDP port 41000 cannot be used [Errno 98] Address already in use +[2023-09-14 12:06:35,208][112573] Port 42000 is available +[2023-09-14 12:06:35,208][112573] Using port 42000 +[2023-09-14 12:06:35,208][112529] Initializing env for player 0, init_info: {'port': 40300}... +[2023-09-14 12:06:35,209][112573] Initializing env for player 0, init_info: {'port': 42000}... +[2023-09-14 12:06:35,213][112539] Port 40600 is available +[2023-09-14 12:06:35,213][112539] Using port 40600 +[2023-09-14 12:06:35,214][112539] Initializing env for player 0, init_info: {'port': 40600}... +[2023-09-14 12:06:35,233][112530] Port 40400 is available +[2023-09-14 12:06:35,233][112530] Using port 40400 +[2023-09-14 12:06:35,233][112540] Port 40800 is available +[2023-09-14 12:06:35,234][112540] Using port 40800 +[2023-09-14 12:06:35,234][112538] Port 40700 is available +[2023-09-14 12:06:35,234][112538] Using port 40700 +[2023-09-14 12:06:35,234][112530] Initializing env for player 0, init_info: {'port': 40400}... +[2023-09-14 12:06:35,234][112540] Initializing env for player 0, init_info: {'port': 40800}... +[2023-09-14 12:06:35,235][112538] Initializing env for player 0, init_info: {'port': 40700}... +[2023-09-14 12:06:35,239][112573] Using port 42000 on host... +[2023-09-14 12:06:35,240][112541] Port 40900 is available +[2023-09-14 12:06:35,240][112536] Port 40500 is available +[2023-09-14 12:06:35,240][112541] Using port 40900 +[2023-09-14 12:06:35,240][112536] Using port 40500 +[2023-09-14 12:06:35,241][112536] Initializing env for player 0, init_info: {'port': 40500}... +[2023-09-14 12:06:35,245][112529] Using port 40300 on host... +[2023-09-14 12:06:35,248][112539] Using port 40600 on host... +[2023-09-14 12:06:35,259][112529] Initializing env for player 1, init_info: {'port': 40300}... +[2023-09-14 12:06:35,260][112573] Initializing env for player 1, init_info: {'port': 42000}... +[2023-09-14 12:06:35,264][112539] Initializing env for player 1, init_info: {'port': 40600}... +[2023-09-14 12:06:35,267][112540] Using port 40800 on host... +[2023-09-14 12:06:35,269][112530] Using port 40400 on host... +[2023-09-14 12:06:35,275][112536] Using port 40500 on host... +[2023-09-14 12:06:35,275][112538] Using port 40700 on host... +[2023-09-14 12:06:35,285][112530] Initializing env for player 1, init_info: {'port': 40400}... +[2023-09-14 12:06:35,285][112540] Initializing env for player 1, init_info: {'port': 40800}... +[2023-09-14 12:06:35,286][112538] Initializing env for player 1, init_info: {'port': 40700}... +[2023-09-14 12:06:35,291][112536] Initializing env for player 1, init_info: {'port': 40500}... +[2023-09-14 12:06:36,182][109198] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 1007616. Throughput: 0: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 12:06:36,360][112540] Initialized w:5 v:0 player:0 +[2023-09-14 12:06:36,361][112540] Initialized w:5 v:0 player:1 +[2023-09-14 12:06:36,362][112540] 2 agent workers initialized for env 5! +[2023-09-14 12:06:36,370][112540] Decorrelating experience for 0 frames... +[2023-09-14 12:06:36,370][112540] Port 40801 is available +[2023-09-14 12:06:36,370][112540] Using port 40801 +[2023-09-14 12:06:36,371][112540] Initializing env for player 0, init_info: {'port': 40801}... +[2023-09-14 12:06:36,395][112539] Initialized w:3 v:0 player:0 +[2023-09-14 12:06:36,396][112539] Initialized w:3 v:0 player:1 +[2023-09-14 12:06:36,398][112539] 2 agent workers initialized for env 3! +[2023-09-14 12:06:36,399][112540] Using port 40801 on host... +[2023-09-14 12:06:36,408][112539] Decorrelating experience for 0 frames... +[2023-09-14 12:06:36,409][112539] Port 40601 is available +[2023-09-14 12:06:36,409][112539] Using port 40601 +[2023-09-14 12:06:36,410][112539] Initializing env for player 0, init_info: {'port': 40601}... +[2023-09-14 12:06:36,411][112573] Initialized w:7 v:0 player:0 +[2023-09-14 12:06:36,411][112573] Initialized w:7 v:0 player:1 +[2023-09-14 12:06:36,413][112573] 2 agent workers initialized for env 7! +[2023-09-14 12:06:36,414][112536] Initialized w:2 v:0 player:0 +[2023-09-14 12:06:36,415][112536] Initialized w:2 v:0 player:1 +[2023-09-14 12:06:36,417][112536] 2 agent workers initialized for env 2! +[2023-09-14 12:06:36,420][112573] Decorrelating experience for 0 frames... +[2023-09-14 12:06:36,421][112573] UDP port 41001 cannot be used [Errno 98] Address already in use +[2023-09-14 12:06:36,421][112573] Port 42001 is available +[2023-09-14 12:06:36,421][112573] Using port 42001 +[2023-09-14 12:06:36,422][112540] Initializing env for player 1, init_info: {'port': 40801}... +[2023-09-14 12:06:36,426][112538] Initialized w:4 v:0 player:1 +[2023-09-14 12:06:36,427][112538] Initialized w:4 v:0 player:0 +[2023-09-14 12:06:36,428][112538] 2 agent workers initialized for env 4! +[2023-09-14 12:06:36,429][112536] Decorrelating experience for 0 frames... +[2023-09-14 12:06:36,430][112536] Port 40501 is available +[2023-09-14 12:06:36,430][112536] Using port 40501 +[2023-09-14 12:06:36,432][112536] Initializing env for player 0, init_info: {'port': 40501}... +[2023-09-14 12:06:36,439][112539] Using port 40601 on host... +[2023-09-14 12:06:36,442][112538] Decorrelating experience for 0 frames... +[2023-09-14 12:06:36,444][112538] Port 40701 is available +[2023-09-14 12:06:36,444][112538] Using port 40701 +[2023-09-14 12:06:36,444][112530] Initialized w:1 v:0 player:0 +[2023-09-14 12:06:36,444][112530] Initialized w:1 v:0 player:1 +[2023-09-14 12:06:36,446][112530] 2 agent workers initialized for env 1! +[2023-09-14 12:06:36,453][112541] Initializing env for player 0, init_info: {'port': 40900}... +[2023-09-14 12:06:36,457][112530] Decorrelating experience for 0 frames... +[2023-09-14 12:06:36,460][112539] Initializing env for player 1, init_info: {'port': 40601}... +[2023-09-14 12:06:36,465][112536] Using port 40501 on host... +[2023-09-14 12:06:36,471][112530] Port 40401 is available +[2023-09-14 12:06:36,471][112530] Using port 40401 +[2023-09-14 12:06:36,482][112536] Initializing env for player 1, init_info: {'port': 40501}... +[2023-09-14 12:06:36,485][112541] Using port 40900 on host... +[2023-09-14 12:06:36,503][112541] Initializing env for player 1, init_info: {'port': 40900}... +[2023-09-14 12:06:36,611][112529] Initialized w:0 v:0 player:1 +[2023-09-14 12:06:36,611][112529] Initialized w:0 v:0 player:0 +[2023-09-14 12:06:36,613][112529] 2 agent workers initialized for env 0! +[2023-09-14 12:06:36,624][112529] Decorrelating experience for 0 frames... +[2023-09-14 12:06:36,625][112529] Port 40301 is available +[2023-09-14 12:06:36,625][112529] Using port 40301 +[2023-09-14 12:06:36,626][112529] Initializing env for player 0, init_info: {'port': 40301}... +[2023-09-14 12:06:36,655][112529] Using port 40301 on host... +[2023-09-14 12:06:36,676][112529] Initializing env for player 1, init_info: {'port': 40301}... +[2023-09-14 12:06:37,482][112540] Initialized w:5 v:1 player:0 +[2023-09-14 12:06:37,482][112540] Initialized w:5 v:1 player:1 +[2023-09-14 12:06:37,484][112540] 2 agent workers initialized for env 5! +[2023-09-14 12:06:37,488][112530] Initializing env for player 0, init_info: {'port': 40401}... +[2023-09-14 12:06:37,496][112540] Decorrelating experience for 32 frames... +[2023-09-14 12:06:37,500][112539] Initialized w:3 v:1 player:1 +[2023-09-14 12:06:37,501][112539] Initialized w:3 v:1 player:0 +[2023-09-14 12:06:37,502][112539] 2 agent workers initialized for env 3! +[2023-09-14 12:06:37,508][112536] Initialized w:2 v:1 player:0 +[2023-09-14 12:06:37,508][112536] Initialized w:2 v:1 player:1 +[2023-09-14 12:06:37,509][112536] 2 agent workers initialized for env 2! +[2023-09-14 12:06:37,511][112538] Initializing env for player 0, init_info: {'port': 40701}... +[2023-09-14 12:06:37,511][112539] Decorrelating experience for 32 frames... +[2023-09-14 12:06:37,518][112536] Decorrelating experience for 32 frames... +[2023-09-14 12:06:37,534][112530] Using port 40401 on host... +[2023-09-14 12:06:37,539][112530] Initializing env for player 1, init_info: {'port': 40401}... +[2023-09-14 12:06:37,546][112538] Using port 40701 on host... +[2023-09-14 12:06:37,561][112538] Initializing env for player 1, init_info: {'port': 40701}... +[2023-09-14 12:06:37,580][112536] Multi agent env, num agents: 2 +[2023-09-14 12:06:37,582][112539] Multi agent env, num agents: 2 +[2023-09-14 12:06:37,583][112540] Multi agent env, num agents: 2 +[2023-09-14 12:06:37,611][112536] Multi agent env, num agents: 2 +[2023-09-14 12:06:37,612][112539] Multi agent env, num agents: 2 +[2023-09-14 12:06:37,620][112541] Initialized w:6 v:0 player:1 +[2023-09-14 12:06:37,621][112541] Initialized w:6 v:0 player:0 +[2023-09-14 12:06:37,623][112541] 2 agent workers initialized for env 6! +[2023-09-14 12:06:37,629][112540] Multi agent env, num agents: 2 +[2023-09-14 12:06:37,634][112541] Decorrelating experience for 0 frames... +[2023-09-14 12:06:37,634][112573] Initializing env for player 0, init_info: {'port': 42001}... +[2023-09-14 12:06:37,635][112541] Port 40901 is available +[2023-09-14 12:06:37,635][112541] Using port 40901 +[2023-09-14 12:06:37,636][112541] Initializing env for player 0, init_info: {'port': 40901}... +[2023-09-14 12:06:37,642][112539] Port 40602 is available +[2023-09-14 12:06:37,642][112539] Using port 40602 +[2023-09-14 12:06:37,642][112536] Port 40502 is available +[2023-09-14 12:06:37,642][112536] Using port 40502 +[2023-09-14 12:06:37,643][112536] Initializing env for player 0, init_info: {'port': 40502}... +[2023-09-14 12:06:37,643][112539] Initializing env for player 0, init_info: {'port': 40602}... +[2023-09-14 12:06:37,662][112540] Port 40802 is available +[2023-09-14 12:06:37,662][112540] Using port 40802 +[2023-09-14 12:06:37,663][112540] Initializing env for player 0, init_info: {'port': 40802}... +[2023-09-14 12:06:37,665][112541] Using port 40901 on host... +[2023-09-14 12:06:37,684][112536] Using port 40502 on host... +[2023-09-14 12:06:37,684][112573] Initializing env for player 1, init_info: {'port': 42001}... +[2023-09-14 12:06:37,686][112541] Initializing env for player 1, init_info: {'port': 40901}... +[2023-09-14 12:06:37,687][112573] Using port 42001 on host... +[2023-09-14 12:06:37,691][112539] Using port 40602 on host... +[2023-09-14 12:06:37,695][112536] Initializing env for player 1, init_info: {'port': 40502}... +[2023-09-14 12:06:37,698][112539] Initializing env for player 1, init_info: {'port': 40602}... +[2023-09-14 12:06:37,707][112540] Using port 40802 on host... +[2023-09-14 12:06:37,717][112540] Initializing env for player 1, init_info: {'port': 40802}... +[2023-09-14 12:06:37,723][112529] Initialized w:0 v:1 player:0 +[2023-09-14 12:06:37,724][112529] Initialized w:0 v:1 player:1 +[2023-09-14 12:06:37,726][112529] 2 agent workers initialized for env 0! +[2023-09-14 12:06:37,744][112529] Decorrelating experience for 32 frames... +[2023-09-14 12:06:37,828][112529] Multi agent env, num agents: 2 +[2023-09-14 12:06:37,871][112529] Multi agent env, num agents: 2 +[2023-09-14 12:06:37,899][112529] Port 40302 is available +[2023-09-14 12:06:37,899][112529] Using port 40302 +[2023-09-14 12:06:38,606][112538] Initialized w:4 v:1 player:1 +[2023-09-14 12:06:38,607][112538] Initialized w:4 v:1 player:0 +[2023-09-14 12:06:38,609][112538] 2 agent workers initialized for env 4! +[2023-09-14 12:06:38,622][112538] Decorrelating experience for 32 frames... +[2023-09-14 12:06:38,691][112538] Multi agent env, num agents: 2 +[2023-09-14 12:06:38,721][112538] Multi agent env, num agents: 2 +[2023-09-14 12:06:38,745][112530] Initialized w:1 v:1 player:0 +[2023-09-14 12:06:38,745][112530] Initialized w:1 v:1 player:1 +[2023-09-14 12:06:38,746][112530] 2 agent workers initialized for env 1! +[2023-09-14 12:06:38,751][112538] Port 40702 is available +[2023-09-14 12:06:38,751][112538] Using port 40702 +[2023-09-14 12:06:38,751][112538] Initializing env for player 0, init_info: {'port': 40702}... +[2023-09-14 12:06:38,752][112541] Initialized w:6 v:1 player:0 +[2023-09-14 12:06:38,753][112541] Initialized w:6 v:1 player:1 +[2023-09-14 12:06:38,753][112536] Initialized w:2 v:2 player:1 +[2023-09-14 12:06:38,754][112536] Initialized w:2 v:2 player:0 +[2023-09-14 12:06:38,755][112541] 2 agent workers initialized for env 6! +[2023-09-14 12:06:38,756][112536] 2 agent workers initialized for env 2! +[2023-09-14 12:06:38,757][112530] Decorrelating experience for 32 frames... +[2023-09-14 12:06:38,766][112541] Decorrelating experience for 32 frames... +[2023-09-14 12:06:38,767][112536] Decorrelating experience for 64 frames... +[2023-09-14 12:06:38,784][112538] Using port 40702 on host... +[2023-09-14 12:06:38,802][112538] Initializing env for player 1, init_info: {'port': 40702}... +[2023-09-14 12:06:38,822][112573] Initialized w:7 v:1 player:1 +[2023-09-14 12:06:38,822][112573] Initialized w:7 v:1 player:0 +[2023-09-14 12:06:38,824][112573] 2 agent workers initialized for env 7! +[2023-09-14 12:06:38,825][112530] Multi agent env, num agents: 2 +[2023-09-14 12:06:38,835][112573] Decorrelating experience for 32 frames... +[2023-09-14 12:06:38,843][112541] Multi agent env, num agents: 2 +[2023-09-14 12:06:38,860][112529] Initializing env for player 0, init_info: {'port': 40302}... +[2023-09-14 12:06:38,869][112539] Initialized w:3 v:2 player:1 +[2023-09-14 12:06:38,871][112539] Initialized w:3 v:2 player:0 +[2023-09-14 12:06:38,871][112539] 2 agent workers initialized for env 3! +[2023-09-14 12:06:38,871][112530] Multi agent env, num agents: 2 +[2023-09-14 12:06:38,879][112541] Multi agent env, num agents: 2 +[2023-09-14 12:06:38,881][112539] Decorrelating experience for 64 frames... +[2023-09-14 12:06:38,904][112529] Using port 40302 on host... +[2023-09-14 12:06:38,914][112529] Initializing env for player 1, init_info: {'port': 40302}... +[2023-09-14 12:06:38,915][112541] Port 40902 is available +[2023-09-14 12:06:38,915][112541] Using port 40902 +[2023-09-14 12:06:38,915][112573] Multi agent env, num agents: 2 +[2023-09-14 12:06:38,915][112536] Port 40503 is available +[2023-09-14 12:06:38,915][112536] Using port 40503 +[2023-09-14 12:06:38,916][112541] Initializing env for player 0, init_info: {'port': 40902}... +[2023-09-14 12:06:38,916][112536] Initializing env for player 0, init_info: {'port': 40503}... +[2023-09-14 12:06:38,917][112530] Port 40402 is available +[2023-09-14 12:06:38,917][112530] Using port 40402 +[2023-09-14 12:06:38,918][112530] Initializing env for player 0, init_info: {'port': 40402}... +[2023-09-14 12:06:38,918][112540] Initialized w:5 v:2 player:1 +[2023-09-14 12:06:38,919][112540] Initialized w:5 v:2 player:0 +[2023-09-14 12:06:38,921][112540] 2 agent workers initialized for env 5! +[2023-09-14 12:06:38,932][112540] Decorrelating experience for 64 frames... +[2023-09-14 12:06:38,944][112541] Using port 40902 on host... +[2023-09-14 12:06:38,945][112536] Using port 40503 on host... +[2023-09-14 12:06:38,953][112573] Multi agent env, num agents: 2 +[2023-09-14 12:06:38,955][112530] Using port 40402 on host... +[2023-09-14 12:06:38,966][112541] Initializing env for player 1, init_info: {'port': 40902}... +[2023-09-14 12:06:38,966][112536] Initializing env for player 1, init_info: {'port': 40503}... +[2023-09-14 12:06:38,968][112530] Initializing env for player 1, init_info: {'port': 40402}... +[2023-09-14 12:06:38,988][112573] UDP port 41002 cannot be used [Errno 98] Address already in use +[2023-09-14 12:06:38,988][112573] Port 42002 is available +[2023-09-14 12:06:38,988][112573] Using port 42002 +[2023-09-14 12:06:38,989][112573] Initializing env for player 0, init_info: {'port': 42002}... +[2023-09-14 12:06:39,022][112573] Using port 42002 on host... +[2023-09-14 12:06:39,028][112539] Port 40603 is available +[2023-09-14 12:06:39,028][112539] Using port 40603 +[2023-09-14 12:06:39,029][112539] Initializing env for player 0, init_info: {'port': 40603}... +[2023-09-14 12:06:39,039][112573] Initializing env for player 1, init_info: {'port': 42002}... +[2023-09-14 12:06:39,069][112539] Using port 40603 on host... +[2023-09-14 12:06:39,079][112539] Initializing env for player 1, init_info: {'port': 40603}... +[2023-09-14 12:06:39,095][112540] Port 40803 is available +[2023-09-14 12:06:39,095][112540] Using port 40803 +[2023-09-14 12:06:39,948][112538] Initialized w:4 v:2 player:1 +[2023-09-14 12:06:39,949][112538] Initialized w:4 v:2 player:0 +[2023-09-14 12:06:39,951][112538] 2 agent workers initialized for env 4! +[2023-09-14 12:06:39,953][112540] Initializing env for player 0, init_info: {'port': 40803}... +[2023-09-14 12:06:39,967][112538] Decorrelating experience for 64 frames... +[2023-09-14 12:06:39,998][112540] Using port 40803 on host... +[2023-09-14 12:06:40,006][112540] Initializing env for player 1, init_info: {'port': 40803}... +[2023-09-14 12:06:40,027][112529] Initialized w:0 v:2 player:0 +[2023-09-14 12:06:40,028][112529] Initialized w:0 v:2 player:1 +[2023-09-14 12:06:40,029][112529] 2 agent workers initialized for env 0! +[2023-09-14 12:06:40,037][112529] Decorrelating experience for 64 frames... +[2023-09-14 12:06:40,044][112536] Initialized w:2 v:3 player:0 +[2023-09-14 12:06:40,045][112536] Initialized w:2 v:3 player:1 +[2023-09-14 12:06:40,046][112536] 2 agent workers initialized for env 2! +[2023-09-14 12:06:40,058][112536] Decorrelating experience for 96 frames... +[2023-09-14 12:06:40,072][112530] Initialized w:1 v:2 player:0 +[2023-09-14 12:06:40,073][112530] Initialized w:1 v:2 player:1 +[2023-09-14 12:06:40,074][112530] 2 agent workers initialized for env 1! +[2023-09-14 12:06:40,076][112541] Initialized w:6 v:2 player:1 +[2023-09-14 12:06:40,077][112541] Initialized w:6 v:2 player:0 +[2023-09-14 12:06:40,078][112541] 2 agent workers initialized for env 6! +[2023-09-14 12:06:40,083][112530] Decorrelating experience for 64 frames... +[2023-09-14 12:06:40,086][112541] Decorrelating experience for 64 frames... +[2023-09-14 12:06:40,114][112538] Port 40703 is available +[2023-09-14 12:06:40,115][112538] Using port 40703 +[2023-09-14 12:06:40,115][112538] Initializing env for player 0, init_info: {'port': 40703}... +[2023-09-14 12:06:40,152][112538] Using port 40703 on host... +[2023-09-14 12:06:40,166][112538] Initializing env for player 1, init_info: {'port': 40703}... +[2023-09-14 12:06:40,182][112529] Port 40303 is available +[2023-09-14 12:06:40,182][112529] Using port 40303 +[2023-09-14 12:06:40,182][112529] Initializing env for player 0, init_info: {'port': 40303}... +[2023-09-14 12:06:40,211][112529] Using port 40303 on host... +[2023-09-14 12:06:40,218][112573] Initialized w:7 v:2 player:0 +[2023-09-14 12:06:40,219][112573] Initialized w:7 v:2 player:1 +[2023-09-14 12:06:40,219][112573] 2 agent workers initialized for env 7! +[2023-09-14 12:06:40,226][112539] Initialized w:3 v:3 player:1 +[2023-09-14 12:06:40,227][112541] Port 40903 is available +[2023-09-14 12:06:40,227][112541] Using port 40903 +[2023-09-14 12:06:40,227][112539] Initialized w:3 v:3 player:0 +[2023-09-14 12:06:40,228][112539] 2 agent workers initialized for env 3! +[2023-09-14 12:06:40,229][112573] Decorrelating experience for 64 frames... +[2023-09-14 12:06:40,233][112529] Initializing env for player 1, init_info: {'port': 40303}... +[2023-09-14 12:06:40,237][112539] Decorrelating experience for 96 frames... +[2023-09-14 12:06:40,239][112530] Port 40403 is available +[2023-09-14 12:06:40,240][112530] Using port 40403 +[2023-09-14 12:06:40,240][112530] Initializing env for player 0, init_info: {'port': 40403}... +[2023-09-14 12:06:40,285][112530] Using port 40403 on host... +[2023-09-14 12:06:40,294][112530] Initializing env for player 1, init_info: {'port': 40403}... +[2023-09-14 12:06:40,370][112573] Port 41003 is available +[2023-09-14 12:06:40,370][112573] Using port 41003 +[2023-09-14 12:06:40,371][112573] Initializing env for player 0, init_info: {'port': 41003}... +[2023-09-14 12:06:40,407][112573] Using port 41003 on host... +[2023-09-14 12:06:40,422][112573] Initializing env for player 1, init_info: {'port': 41003}... +[2023-09-14 12:06:41,123][112540] Initialized w:5 v:3 player:0 +[2023-09-14 12:06:41,123][112540] Initialized w:5 v:3 player:1 +[2023-09-14 12:06:41,124][112540] 2 agent workers initialized for env 5! +[2023-09-14 12:06:41,135][112540] Decorrelating experience for 96 frames... +[2023-09-14 12:06:41,181][109198] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 1007616. Throughput: 0: 180.8. Samples: 904. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 12:06:41,281][112529] Initialized w:0 v:3 player:0 +[2023-09-14 12:06:41,282][112529] Initialized w:0 v:3 player:1 +[2023-09-14 12:06:41,283][112529] 2 agent workers initialized for env 0! +[2023-09-14 12:06:41,292][112538] Initialized w:4 v:3 player:1 +[2023-09-14 12:06:41,293][112538] Initialized w:4 v:3 player:0 +[2023-09-14 12:06:41,293][112529] Decorrelating experience for 96 frames... +[2023-09-14 12:06:41,294][112538] 2 agent workers initialized for env 4! +[2023-09-14 12:06:41,296][112541] Initializing env for player 0, init_info: {'port': 40903}... +[2023-09-14 12:06:41,311][112538] Decorrelating experience for 96 frames... +[2023-09-14 12:06:41,326][112530] Initialized w:1 v:3 player:1 +[2023-09-14 12:06:41,326][112530] Initialized w:1 v:3 player:0 +[2023-09-14 12:06:41,328][112530] 2 agent workers initialized for env 1! +[2023-09-14 12:06:41,329][112541] Using port 40903 on host... +[2023-09-14 12:06:41,346][112541] Initializing env for player 1, init_info: {'port': 40903}... +[2023-09-14 12:06:41,346][112530] Decorrelating experience for 96 frames... +[2023-09-14 12:06:41,526][112573] Initialized w:7 v:3 player:1 +[2023-09-14 12:06:42,369][112382] Signal inference workers to stop experience collection... +[2023-09-14 12:06:42,385][112541] Initialized w:6 v:3 player:1 +[2023-09-14 12:06:42,386][112541] Initialized w:6 v:3 player:0 +[2023-09-14 12:06:42,387][112541] 2 agent workers initialized for env 6! +[2023-09-14 12:06:42,394][112541] Decorrelating experience for 96 frames... +[2023-09-14 12:06:42,455][112519] InferenceWorker_p0-w0: stopping experience collection +[2023-09-14 12:06:42,525][112573] Initialized w:7 v:3 player:0 +[2023-09-14 12:06:42,527][112573] 2 agent workers initialized for env 7! +[2023-09-14 12:06:42,540][112573] Decorrelating experience for 96 frames... +[2023-09-14 12:06:44,874][112382] Signal inference workers to resume experience collection... +[2023-09-14 12:06:44,875][112519] InferenceWorker_p0-w0: resuming experience collection +[2023-09-14 12:06:44,876][112382] Stopping Batcher_0... +[2023-09-14 12:06:44,876][112382] Loop batcher_evt_loop terminating... +[2023-09-14 12:06:44,884][109198] Component Batcher_0 stopped! +[2023-09-14 12:06:45,623][112519] Weights refcount: 2 0 +[2023-09-14 12:06:45,624][112519] Stopping InferenceWorker_p0-w0... +[2023-09-14 12:06:45,625][112519] Loop inference_proc0-0_evt_loop terminating... +[2023-09-14 12:06:45,625][109198] Component InferenceWorker_p0-w0 stopped! +[2023-09-14 12:06:45,679][112540] Stopping RolloutWorker_w5... +[2023-09-14 12:06:45,679][112540] Loop rollout_proc5_evt_loop terminating... +[2023-09-14 12:06:45,679][112538] Stopping RolloutWorker_w4... +[2023-09-14 12:06:45,679][112536] Stopping RolloutWorker_w2... +[2023-09-14 12:06:45,680][112530] Stopping RolloutWorker_w1... +[2023-09-14 12:06:45,680][112530] Loop rollout_proc1_evt_loop terminating... +[2023-09-14 12:06:45,680][112538] Loop rollout_proc4_evt_loop terminating... +[2023-09-14 12:06:45,680][112539] Stopping RolloutWorker_w3... +[2023-09-14 12:06:45,680][112541] Stopping RolloutWorker_w6... +[2023-09-14 12:06:45,680][112529] Stopping RolloutWorker_w0... +[2023-09-14 12:06:45,680][112536] Loop rollout_proc2_evt_loop terminating... +[2023-09-14 12:06:45,679][109198] Component RolloutWorker_w5 stopped! +[2023-09-14 12:06:45,681][112539] Loop rollout_proc3_evt_loop terminating... +[2023-09-14 12:06:45,681][112573] Stopping RolloutWorker_w7... +[2023-09-14 12:06:45,681][112541] Loop rollout_proc6_evt_loop terminating... +[2023-09-14 12:06:45,681][112529] Loop rollout_proc0_evt_loop terminating... +[2023-09-14 12:06:45,682][112573] Loop rollout_proc7_evt_loop terminating... +[2023-09-14 12:06:45,681][109198] Component RolloutWorker_w4 stopped! +[2023-09-14 12:06:45,684][109198] Component RolloutWorker_w2 stopped! +[2023-09-14 12:06:45,686][109198] Component RolloutWorker_w1 stopped! +[2023-09-14 12:06:45,688][109198] Component RolloutWorker_w6 stopped! +[2023-09-14 12:06:45,689][109198] Component RolloutWorker_w3 stopped! +[2023-09-14 12:06:45,690][109198] Component RolloutWorker_w0 stopped! +[2023-09-14 12:06:45,691][109198] Component RolloutWorker_w7 stopped! +[2023-09-14 12:06:46,096][112382] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000248_1015808.pth... +[2023-09-14 12:06:46,152][112382] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000128_524288.pth +[2023-09-14 12:06:46,160][112382] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000248_1015808.pth... +[2023-09-14 12:06:46,221][112382] Stopping LearnerWorker_p0... +[2023-09-14 12:06:46,222][112382] Loop learner_proc0_evt_loop terminating... +[2023-09-14 12:06:46,222][109198] Component LearnerWorker_p0 stopped! +[2023-09-14 12:06:46,224][109198] Waiting for process learner_proc0 to stop... +[2023-09-14 12:06:46,809][109198] Waiting for process inference_proc0-0 to join... +[2023-09-14 12:06:46,811][109198] Waiting for process rollout_proc0 to join... +[2023-09-14 12:06:46,812][109198] Waiting for process rollout_proc1 to join... +[2023-09-14 12:06:46,814][109198] Waiting for process rollout_proc2 to join... +[2023-09-14 12:06:46,816][109198] Waiting for process rollout_proc3 to join... +[2023-09-14 12:06:46,817][109198] Waiting for process rollout_proc4 to join... +[2023-09-14 12:06:46,819][109198] Waiting for process rollout_proc5 to join... +[2023-09-14 12:06:46,820][109198] Waiting for process rollout_proc6 to join... +[2023-09-14 12:06:46,822][109198] Waiting for process rollout_proc7 to join... +[2023-09-14 12:06:46,823][109198] Batcher 0 profile tree view: +batching: 0.2217, releasing_batches: 0.0004 +[2023-09-14 12:06:46,824][109198] InferenceWorker_p0-w0 profile tree view: +wait_policy: 0.0051 + wait_policy_total: 5.3989 +update_model: 0.6777 + weight_update: 0.6688 +one_step: 0.0360 + handle_policy_step: 1.8453 + deserialize: 0.0423, stack: 0.0049, obs_to_device_normalize: 0.2151, forward: 1.4397, send_messages: 0.0292 + prepare_outputs: 0.0812 + to_cpu: 0.0434 +[2023-09-14 12:06:46,825][109198] Learner 0 profile tree view: +misc: 0.0000, prepare_batch: 2.0064 +train: 2.8124 + epoch_init: 0.0000, minibatch_init: 0.0000, losses_postprocess: 0.0004, kl_divergence: 0.0018, after_optimizer: 0.0043 + calculate_losses: 0.3365 + losses_init: 0.0000, forward_head: 0.3055, bptt_initial: 0.0129, tail: 0.0066, advantages_returns: 0.0010, losses: 0.0065 + bptt: 0.0037 + bptt_forward_core: 0.0036 + update: 2.4684 + clip: 0.0302 +[2023-09-14 12:06:46,826][109198] RolloutWorker_w0 profile tree view: +wait_for_trajectories: 0.0006, enqueue_policy_requests: 0.0167, env_step: 0.4727, overhead: 0.0092, complete_rollouts: 0.0003 +save_policy_outputs: 0.0189 + split_output_tensors: 0.0064 +[2023-09-14 12:06:46,828][109198] RolloutWorker_w7 profile tree view: +wait_for_trajectories: 0.0004, enqueue_policy_requests: 0.0008 +[2023-09-14 12:06:46,829][109198] Loop Runner_EvtLoop terminating... +[2023-09-14 12:06:46,830][109198] Runner profile tree view: +main_loop: 16.5670 +[2023-09-14 12:06:46,831][109198] Collected {0: 1015808}, FPS: 494.5 +[2023-09-14 12:06:46,884][109198] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json +[2023-09-14 12:06:46,885][109198] Overriding arg 'num_workers' with value 1 passed from command line +[2023-09-14 12:06:46,885][109198] Adding new argument 'no_render'=True that is not in the saved config file! +[2023-09-14 12:06:46,886][109198] Adding new argument 'save_video'=True that is not in the saved config file! +[2023-09-14 12:06:46,887][109198] Adding new argument 'video_frames'=1000000000.0 that is not in the saved config file! +[2023-09-14 12:06:46,888][109198] Adding new argument 'video_name'=None that is not in the saved config file! +[2023-09-14 12:06:46,889][109198] Adding new argument 'max_num_frames'=100000 that is not in the saved config file! +[2023-09-14 12:06:46,889][109198] Adding new argument 'max_num_episodes'=10 that is not in the saved config file! +[2023-09-14 12:06:46,890][109198] Adding new argument 'push_to_hub'=True that is not in the saved config file! +[2023-09-14 12:06:46,891][109198] Adding new argument 'hf_repository'='MattStammers/vizdoom_duel' that is not in the saved config file! +[2023-09-14 12:06:46,892][109198] Adding new argument 'policy_index'=0 that is not in the saved config file! +[2023-09-14 12:06:46,893][109198] Adding new argument 'eval_deterministic'=False that is not in the saved config file! +[2023-09-14 12:06:46,893][109198] Adding new argument 'train_script'=None that is not in the saved config file! +[2023-09-14 12:06:46,894][109198] Adding new argument 'enjoy_script'=None that is not in the saved config file! +[2023-09-14 12:06:46,895][109198] Using frameskip 1 and render_action_repeat=4 for evaluation +[2023-09-14 12:06:46,897][109198] Multi agent env, num agents: 2 +[2023-09-14 12:06:46,930][109198] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:06:46,934][109198] RunningMeanStd input shape: (23,) +[2023-09-14 12:06:46,935][109198] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:06:46,936][109198] RunningMeanStd input shape: (1,) +[2023-09-14 12:06:46,953][109198] ConvEncoder: input_channels=3 +[2023-09-14 12:06:47,084][109198] Conv encoder output size: 512 +[2023-09-14 12:06:47,086][109198] Policy head output size: 640 +[2023-09-14 12:06:47,963][109198] Loading state from checkpoint /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000248_1015808.pth... +[2023-09-14 12:06:47,994][109198] Port 40300 is available +[2023-09-14 12:06:47,995][109198] Using port 40300 +[2023-09-14 12:06:47,996][109198] Initializing env for player 0, init_info: {'port': 40300}... +[2023-09-14 12:06:48,046][109198] Initializing env for player 1, init_info: {'port': 40300}... +[2023-09-14 12:06:48,096][109198] 2 agent workers initialized for env 0! +[2023-09-14 12:06:48,099][109198] Using port 40300 on host... +[2023-09-14 12:06:49,138][109198] Initialized w:0 v:0 player:0 +[2023-09-14 12:06:49,139][109198] Initialized w:0 v:0 player:1 +[2023-09-14 12:06:49,625][109198] Num frames 100... +[2023-09-14 12:06:49,914][109198] Num frames 200... +[2023-09-14 12:06:50,161][109198] Num frames 300... +[2023-09-14 12:06:50,420][109198] Num frames 400... +[2023-09-14 12:06:50,662][109198] Num frames 500... +[2023-09-14 12:06:50,922][109198] Num frames 600... +[2023-09-14 12:06:51,210][109198] Num frames 700... +[2023-09-14 12:06:51,468][109198] Num frames 800... +[2023-09-14 12:06:51,731][109198] Num frames 900... +[2023-09-14 12:06:51,962][109198] Num frames 1000... +[2023-09-14 12:06:52,201][109198] Num frames 1100... +[2023-09-14 12:06:52,452][109198] Num frames 1200... +[2023-09-14 12:06:52,694][109198] Num frames 1300... +[2023-09-14 12:06:52,925][109198] Num frames 1400... +[2023-09-14 12:06:53,158][109198] Num frames 1500... +[2023-09-14 12:06:53,400][109198] Num frames 1600... +[2023-09-14 12:06:53,626][109198] Num frames 1700... +[2023-09-14 12:06:53,851][109198] Num frames 1800... +[2023-09-14 12:06:54,085][109198] Num frames 1900... +[2023-09-14 12:06:54,372][109198] Num frames 2000... +[2023-09-14 12:06:54,599][109198] Num frames 2100... +[2023-09-14 12:06:54,845][109198] Num frames 2200... +[2023-09-14 12:06:55,082][109198] Num frames 2300... +[2023-09-14 12:06:55,309][109198] Num frames 2400... +[2023-09-14 12:06:55,590][109198] Num frames 2500... +[2023-09-14 12:06:55,872][109198] Num frames 2600... +[2023-09-14 12:06:56,120][109198] Num frames 2700... +[2023-09-14 12:06:56,356][109198] Num frames 2800... +[2023-09-14 12:06:56,605][109198] Num frames 2900... +[2023-09-14 12:06:56,849][109198] Num frames 3000... +[2023-09-14 12:06:57,134][109198] Num frames 3100... +[2023-09-14 12:06:57,384][109198] Num frames 3200... +[2023-09-14 12:06:57,673][109198] Num frames 3300... +[2023-09-14 12:06:57,931][109198] Num frames 3400... +[2023-09-14 12:06:58,202][109198] Num frames 3500... +[2023-09-14 12:06:58,469][109198] Num frames 3600... +[2023-09-14 12:06:58,724][109198] Num frames 3700... +[2023-09-14 12:06:58,980][109198] Num frames 3800... +[2023-09-14 12:06:59,248][109198] Num frames 3900... +[2023-09-14 12:06:59,475][109198] Num frames 4000... +[2023-09-14 12:06:59,735][109198] Num frames 4100... +[2023-09-14 12:06:59,981][109198] Num frames 4200... +[2023-09-14 12:07:00,233][109198] Num frames 4300... +[2023-09-14 12:07:00,463][109198] Num frames 4400... +[2023-09-14 12:07:00,680][109198] Num frames 4500... +[2023-09-14 12:07:00,935][109198] Num frames 4600... +[2023-09-14 12:07:01,224][109198] Num frames 4700... +[2023-09-14 12:07:01,515][109198] Num frames 4800... +[2023-09-14 12:07:01,773][109198] Num frames 4900... +[2023-09-14 12:07:02,022][109198] Num frames 5000... +[2023-09-14 12:07:02,280][109198] Num frames 5100... +[2023-09-14 12:07:02,515][109198] Num frames 5200... +[2023-09-14 12:07:02,750][109198] Num frames 5300... +[2023-09-14 12:07:02,976][109198] Num frames 5400... +[2023-09-14 12:07:03,206][109198] Num frames 5500... +[2023-09-14 12:07:03,432][109198] Num frames 5600... +[2023-09-14 12:07:03,682][109198] Num frames 5700... +[2023-09-14 12:07:03,919][109198] Num frames 5800... +[2023-09-14 12:07:04,155][109198] Num frames 5900... +[2023-09-14 12:07:04,443][109198] Num frames 6000... +[2023-09-14 12:07:04,717][109198] Num frames 6100... +[2023-09-14 12:07:04,959][109198] Num frames 6200... +[2023-09-14 12:07:05,189][109198] Num frames 6300... +[2023-09-14 12:07:05,459][109198] Num frames 6400... +[2023-09-14 12:07:05,718][109198] Num frames 6500... +[2023-09-14 12:07:05,988][109198] Num frames 6600... +[2023-09-14 12:07:06,226][109198] Num frames 6700... +[2023-09-14 12:07:06,493][109198] Num frames 6800... +[2023-09-14 12:07:06,725][109198] Num frames 6900... +[2023-09-14 12:07:06,991][109198] Num frames 7000... +[2023-09-14 12:07:07,252][109198] Num frames 7100... +[2023-09-14 12:07:07,509][109198] Num frames 7200... +[2023-09-14 12:07:07,746][109198] Num frames 7300... +[2023-09-14 12:07:08,020][109198] Num frames 7400... +[2023-09-14 12:07:08,315][109198] Num frames 7500... +[2023-09-14 12:07:08,574][109198] Num frames 7600... +[2023-09-14 12:07:08,810][109198] Num frames 7700... +[2023-09-14 12:07:09,049][109198] Num frames 7800... +[2023-09-14 12:07:09,306][109198] Num frames 7900... +[2023-09-14 12:07:09,550][109198] Num frames 8000... +[2023-09-14 12:07:09,777][109198] Num frames 8100... +[2023-09-14 12:07:10,024][109198] Num frames 8200... +[2023-09-14 12:07:10,242][109198] Num frames 8300... +[2023-09-14 12:07:10,470][109198] DAMAGECOUNT value on done: 110.0 +[2023-09-14 12:07:10,471][109198] DAMAGECOUNT value on done: 135.0 +[2023-09-14 12:07:10,473][109198] Sum rewards: 15.558, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.005', 'AMMO4': '0.020', 'AMMO3': '0.030', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon5': '0.260', 'WEAPON3': '0.300', 'DAMAGECOUNT': '1.350', 'weapon2': '1.736', 'FRAGCOUNT': '1.999', 'weapon4': '2.518', 'weapon3': '9.286'} +[2023-09-14 12:07:10,533][109198] Avg episode rewards: #0: 13.345, #1: 15.558, true rewards: #0: 0.000, #1: 1.000 +[2023-09-14 12:07:10,534][109198] Avg episode reward: 14.451, avg true_objective: 0.500 +[2023-09-14 12:07:10,540][109198] Num frames 8400... +[2023-09-14 12:07:10,817][109198] Num frames 8500... +[2023-09-14 12:07:11,058][109198] Num frames 8600... +[2023-09-14 12:07:11,339][109198] Num frames 8700... +[2023-09-14 12:07:11,588][109198] Num frames 8800... +[2023-09-14 12:07:11,863][109198] Num frames 8900... +[2023-09-14 12:07:12,111][109198] Num frames 9000... +[2023-09-14 12:07:12,370][109198] Num frames 9100... +[2023-09-14 12:07:12,676][109198] Num frames 9200... +[2023-09-14 12:07:12,949][109198] Num frames 9300... +[2023-09-14 12:07:13,211][109198] Num frames 9400... +[2023-09-14 12:07:13,486][109198] Num frames 9500... +[2023-09-14 12:07:13,753][109198] Num frames 9600... +[2023-09-14 12:07:13,995][109198] Num frames 9700... +[2023-09-14 12:07:14,265][109198] Num frames 9800... +[2023-09-14 12:07:14,541][109198] Num frames 9900... +[2023-09-14 12:07:14,831][109198] Num frames 10000... +[2023-09-14 12:07:15,079][109198] Num frames 10100... +[2023-09-14 12:07:15,314][109198] Num frames 10200... +[2023-09-14 12:07:15,581][109198] Num frames 10300... +[2023-09-14 12:07:15,829][109198] Num frames 10400... +[2023-09-14 12:07:16,095][109198] Num frames 10500... +[2023-09-14 12:07:16,338][109198] Num frames 10600... +[2023-09-14 12:07:16,583][109198] Num frames 10700... +[2023-09-14 12:07:16,820][109198] Num frames 10800... +[2023-09-14 12:07:17,076][109198] Num frames 10900... +[2023-09-14 12:07:17,347][109198] Num frames 11000... +[2023-09-14 12:07:17,672][109198] Num frames 11100... +[2023-09-14 12:07:17,933][109198] Num frames 11200... +[2023-09-14 12:07:18,200][109198] Num frames 11300... +[2023-09-14 12:07:18,449][109198] Num frames 11400... +[2023-09-14 12:07:18,690][109198] Num frames 11500... +[2023-09-14 12:07:18,931][109198] Num frames 11600... +[2023-09-14 12:07:19,180][109198] Num frames 11700... +[2023-09-14 12:07:19,440][109198] Num frames 11800... +[2023-09-14 12:07:19,700][109198] Num frames 11900... +[2023-09-14 12:07:19,950][109198] Num frames 12000... +[2023-09-14 12:07:20,208][109198] Num frames 12100... +[2023-09-14 12:07:20,481][109198] Num frames 12200... +[2023-09-14 12:07:20,767][109198] Num frames 12300... +[2023-09-14 12:07:21,022][109198] Num frames 12400... +[2023-09-14 12:07:21,306][109198] Num frames 12500... +[2023-09-14 12:07:21,558][109198] Num frames 12600... +[2023-09-14 12:07:21,824][109198] Num frames 12700... +[2023-09-14 12:07:22,100][109198] Num frames 12800... +[2023-09-14 12:07:22,353][109198] Num frames 12900... +[2023-09-14 12:07:22,593][109198] Num frames 13000... +[2023-09-14 12:07:22,824][109198] Num frames 13100... +[2023-09-14 12:07:23,066][109198] Num frames 13200... +[2023-09-14 12:07:23,317][109198] Num frames 13300... +[2023-09-14 12:07:23,560][109198] Num frames 13400... +[2023-09-14 12:07:23,821][109198] Num frames 13500... +[2023-09-14 12:07:24,074][109198] Num frames 13600... +[2023-09-14 12:07:24,386][109198] Num frames 13700... +[2023-09-14 12:07:24,628][109198] Num frames 13800... +[2023-09-14 12:07:24,875][109198] Num frames 13900... +[2023-09-14 12:07:25,122][109198] Num frames 14000... +[2023-09-14 12:07:25,365][109198] Num frames 14100... +[2023-09-14 12:07:25,630][109198] Num frames 14200... +[2023-09-14 12:07:25,892][109198] Num frames 14300... +[2023-09-14 12:07:26,145][109198] Num frames 14400... +[2023-09-14 12:07:26,399][109198] Num frames 14500... +[2023-09-14 12:07:26,647][109198] Num frames 14600... +[2023-09-14 12:07:26,920][109198] Num frames 14700... +[2023-09-14 12:07:27,220][109198] Num frames 14800... +[2023-09-14 12:07:27,501][109198] Num frames 14900... +[2023-09-14 12:07:27,802][109198] Num frames 15000... +[2023-09-14 12:07:28,071][109198] Num frames 15100... +[2023-09-14 12:07:28,381][109198] Num frames 15200... +[2023-09-14 12:07:28,654][109198] Num frames 15300... +[2023-09-14 12:07:28,915][109198] Num frames 15400... +[2023-09-14 12:07:29,221][109198] Num frames 15500... +[2023-09-14 12:07:29,475][109198] Num frames 15600... +[2023-09-14 12:07:29,703][109198] Num frames 15700... +[2023-09-14 12:07:29,982][109198] Num frames 15800... +[2023-09-14 12:07:30,235][109198] Num frames 15900... +[2023-09-14 12:07:30,498][109198] Num frames 16000... +[2023-09-14 12:07:30,759][109198] Num frames 16100... +[2023-09-14 12:07:31,026][109198] Num frames 16200... +[2023-09-14 12:07:31,337][109198] Num frames 16300... +[2023-09-14 12:07:31,623][109198] Num frames 16400... +[2023-09-14 12:07:31,906][109198] Num frames 16500... +[2023-09-14 12:07:32,189][109198] Num frames 16600... +[2023-09-14 12:07:32,436][109198] Num frames 16700... +[2023-09-14 12:07:32,659][109198] DAMAGECOUNT value on done: 200.0 +[2023-09-14 12:07:32,659][109198] DAMAGECOUNT value on done: 250.0 +[2023-09-14 12:07:32,661][109198] Sum rewards: 14.835, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO2': '0.015', 'AMMO4': '0.074', 'AMMO3': '0.078', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'weapon5': '0.564', 'WEAPON3': '0.600', 'weapon2': '0.962', 'FRAGCOUNT': '0.998', 'DAMAGECOUNT': '1.150', 'weapon4': '1.320', 'weapon3': '12.660'} +[2023-09-14 12:07:32,722][109198] Avg episode rewards: #0: 14.328, #1: 15.196, true rewards: #0: 0.500, #1: 0.500 +[2023-09-14 12:07:32,724][109198] Avg episode reward: 14.762, avg true_objective: 0.500 +[2023-09-14 12:07:32,734][109198] Num frames 16800... +[2023-09-14 12:07:32,961][109198] Num frames 16900... +[2023-09-14 12:07:33,178][109198] Num frames 17000... +[2023-09-14 12:07:33,396][109198] Num frames 17100... +[2023-09-14 12:07:33,638][109198] Num frames 17200... +[2023-09-14 12:07:33,901][109198] Num frames 17300... +[2023-09-14 12:07:34,172][109198] Num frames 17400... +[2023-09-14 12:07:34,481][109198] Num frames 17500... +[2023-09-14 12:07:34,757][109198] Num frames 17600... +[2023-09-14 12:07:35,008][109198] Num frames 17700... +[2023-09-14 12:07:35,238][109198] Num frames 17800... +[2023-09-14 12:07:35,496][109198] Num frames 17900... +[2023-09-14 12:07:35,766][109198] Num frames 18000... +[2023-09-14 12:07:36,041][109198] Num frames 18100... +[2023-09-14 12:07:36,292][109198] Num frames 18200... +[2023-09-14 12:07:36,526][109198] Num frames 18300... +[2023-09-14 12:07:36,759][109198] Num frames 18400... +[2023-09-14 12:07:37,000][109198] Num frames 18500... +[2023-09-14 12:07:37,235][109198] Num frames 18600... +[2023-09-14 12:07:37,512][109198] Num frames 18700... +[2023-09-14 12:07:37,752][109198] Num frames 18800... +[2023-09-14 12:07:38,000][109198] Num frames 18900... +[2023-09-14 12:07:38,280][109198] Num frames 19000... +[2023-09-14 12:07:38,560][109198] Num frames 19100... +[2023-09-14 12:07:38,831][109198] Num frames 19200... +[2023-09-14 12:07:39,072][109198] Num frames 19300... +[2023-09-14 12:07:39,336][109198] Num frames 19400... +[2023-09-14 12:07:39,591][109198] Num frames 19500... +[2023-09-14 12:07:39,844][109198] Num frames 19600... +[2023-09-14 12:07:40,108][109198] Num frames 19700... +[2023-09-14 12:07:40,379][109198] Num frames 19800... +[2023-09-14 12:07:40,629][109198] Num frames 19900... +[2023-09-14 12:07:40,902][109198] Num frames 20000... +[2023-09-14 12:07:41,200][109198] Num frames 20100... +[2023-09-14 12:07:41,456][109198] Num frames 20200... +[2023-09-14 12:07:41,734][109198] Num frames 20300... +[2023-09-14 12:07:41,985][109198] Num frames 20400... +[2023-09-14 12:07:42,247][109198] Num frames 20500... +[2023-09-14 12:07:42,493][109198] Num frames 20600... +[2023-09-14 12:07:42,728][109198] Num frames 20700... +[2023-09-14 12:07:43,004][109198] Num frames 20800... +[2023-09-14 12:07:43,250][109198] Num frames 20900... +[2023-09-14 12:07:43,508][109198] Num frames 21000... +[2023-09-14 12:07:43,764][109198] Num frames 21100... +[2023-09-14 12:07:44,076][109198] Num frames 21200... +[2023-09-14 12:07:44,396][109198] Num frames 21300... +[2023-09-14 12:07:44,674][109198] Num frames 21400... +[2023-09-14 12:07:44,927][109198] Num frames 21500... +[2023-09-14 12:07:45,160][109198] Num frames 21600... +[2023-09-14 12:07:45,444][109198] Num frames 21700... +[2023-09-14 12:07:45,695][109198] Num frames 21800... +[2023-09-14 12:07:45,948][109198] Num frames 21900... +[2023-09-14 12:07:46,196][109198] Num frames 22000... +[2023-09-14 12:07:46,439][109198] Num frames 22100... +[2023-09-14 12:07:46,688][109198] Num frames 22200... +[2023-09-14 12:07:46,978][109198] Num frames 22300... +[2023-09-14 12:07:47,238][109198] Num frames 22400... +[2023-09-14 12:07:47,500][109198] Num frames 22500... +[2023-09-14 12:07:47,748][109198] Num frames 22600... +[2023-09-14 12:07:47,993][109198] Num frames 22700... +[2023-09-14 12:07:48,305][109198] Num frames 22800... +[2023-09-14 12:07:48,541][109198] Num frames 22900... +[2023-09-14 12:07:48,804][109198] Num frames 23000... +[2023-09-14 12:07:49,052][109198] Num frames 23100... +[2023-09-14 12:07:49,337][109198] Num frames 23200... +[2023-09-14 12:07:49,587][109198] Num frames 23300... +[2023-09-14 12:07:49,835][109198] Num frames 23400... +[2023-09-14 12:07:50,093][109198] Num frames 23500... +[2023-09-14 12:07:50,348][109198] Num frames 23600... +[2023-09-14 12:07:50,604][109198] Num frames 23700... +[2023-09-14 12:07:50,859][109198] Num frames 23800... +[2023-09-14 12:07:51,105][109198] Num frames 23900... +[2023-09-14 12:07:51,420][109198] Num frames 24000... +[2023-09-14 12:07:51,725][109198] Num frames 24100... +[2023-09-14 12:07:51,963][109198] Num frames 24200... +[2023-09-14 12:07:52,231][109198] Num frames 24300... +[2023-09-14 12:07:52,487][109198] Num frames 24400... +[2023-09-14 12:07:52,753][109198] Num frames 24500... +[2023-09-14 12:07:53,000][109198] Num frames 24600... +[2023-09-14 12:07:53,251][109198] Num frames 24700... +[2023-09-14 12:07:53,501][109198] Num frames 24800... +[2023-09-14 12:07:53,744][109198] Num frames 24900... +[2023-09-14 12:07:53,985][109198] Num frames 25000... +[2023-09-14 12:07:54,234][109198] Num frames 25100... +[2023-09-14 12:07:54,516][109198] DAMAGECOUNT value on done: 235.0 +[2023-09-14 12:07:54,516][109198] DAMAGECOUNT value on done: 330.0 +[2023-09-14 12:07:54,518][109198] Sum rewards: 7.895, reward structure: {'HEALTH': '-0.350', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO3': '0.025', 'WEAPON3': '0.200', 'DAMAGECOUNT': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.894', 'weapon3': '4.356'} +[2023-09-14 12:07:54,582][109198] Avg episode rewards: #0: 12.971, #1: 12.762, true rewards: #0: 0.333, #1: 0.667 +[2023-09-14 12:07:54,584][109198] Avg episode reward: 12.867, avg true_objective: 0.500 +[2023-09-14 12:07:54,595][109198] Num frames 25200... +[2023-09-14 12:07:54,887][109198] Num frames 25300... +[2023-09-14 12:07:55,119][109198] Num frames 25400... +[2023-09-14 12:07:55,378][109198] Num frames 25500... +[2023-09-14 12:07:55,655][109198] Num frames 25600... +[2023-09-14 12:07:55,902][109198] Num frames 25700... +[2023-09-14 12:07:56,163][109198] Num frames 25800... +[2023-09-14 12:07:56,398][109198] Num frames 25900... +[2023-09-14 12:07:56,660][109198] Num frames 26000... +[2023-09-14 12:07:56,911][109198] Num frames 26100... +[2023-09-14 12:07:57,173][109198] Num frames 26200... +[2023-09-14 12:07:57,474][109198] Num frames 26300... +[2023-09-14 12:07:57,712][109198] Num frames 26400... +[2023-09-14 12:07:57,981][109198] Num frames 26500... +[2023-09-14 12:07:58,232][109198] Num frames 26600... +[2023-09-14 12:07:58,511][109198] Num frames 26700... +[2023-09-14 12:07:58,776][109198] Num frames 26800... +[2023-09-14 12:07:59,025][109198] Num frames 26900... +[2023-09-14 12:07:59,304][109198] Num frames 27000... +[2023-09-14 12:07:59,538][109198] Num frames 27100... +[2023-09-14 12:07:59,781][109198] Num frames 27200... +[2023-09-14 12:08:00,022][109198] Num frames 27300... +[2023-09-14 12:08:00,276][109198] Num frames 27400... +[2023-09-14 12:08:00,530][109198] Num frames 27500... +[2023-09-14 12:08:00,796][109198] Num frames 27600... +[2023-09-14 12:08:01,037][109198] Num frames 27700... +[2023-09-14 12:08:01,308][109198] Num frames 27800... +[2023-09-14 12:08:01,540][109198] Num frames 27900... +[2023-09-14 12:08:01,794][109198] Num frames 28000... +[2023-09-14 12:08:02,035][109198] Num frames 28100... +[2023-09-14 12:08:02,292][109198] Num frames 28200... +[2023-09-14 12:08:02,585][109198] Num frames 28300... +[2023-09-14 12:08:02,828][109198] Num frames 28400... +[2023-09-14 12:08:03,081][109198] Num frames 28500... +[2023-09-14 12:08:03,348][109198] Num frames 28600... +[2023-09-14 12:08:03,590][109198] Num frames 28700... +[2023-09-14 12:08:03,834][109198] Num frames 28800... +[2023-09-14 12:08:04,075][109198] Num frames 28900... +[2023-09-14 12:08:04,377][109198] Num frames 29000... +[2023-09-14 12:08:04,676][109198] Num frames 29100... +[2023-09-14 12:08:04,924][109198] Num frames 29200... +[2023-09-14 12:08:05,149][109198] Num frames 29300... +[2023-09-14 12:08:05,413][109198] Num frames 29400... +[2023-09-14 12:08:05,643][109198] Num frames 29500... +[2023-09-14 12:08:05,892][109198] Num frames 29600... +[2023-09-14 12:08:06,135][109198] Num frames 29700... +[2023-09-14 12:08:06,365][109198] Num frames 29800... +[2023-09-14 12:08:06,598][109198] Num frames 29900... +[2023-09-14 12:08:06,827][109198] Num frames 30000... +[2023-09-14 12:08:07,096][109198] Num frames 30100... +[2023-09-14 12:08:07,347][109198] Num frames 30200... +[2023-09-14 12:08:07,614][109198] Num frames 30300... +[2023-09-14 12:08:07,833][109198] Num frames 30400... +[2023-09-14 12:08:08,095][109198] Num frames 30500... +[2023-09-14 12:08:08,380][109198] Num frames 30600... +[2023-09-14 12:08:08,646][109198] Num frames 30700... +[2023-09-14 12:08:08,911][109198] Num frames 30800... +[2023-09-14 12:08:09,189][109198] Num frames 30900... +[2023-09-14 12:08:09,451][109198] Num frames 31000... +[2023-09-14 12:08:09,704][109198] Num frames 31100... +[2023-09-14 12:08:09,934][109198] Num frames 31200... +[2023-09-14 12:08:10,179][109198] Num frames 31300... +[2023-09-14 12:08:10,413][109198] Num frames 31400... +[2023-09-14 12:08:10,639][109198] Num frames 31500... +[2023-09-14 12:08:10,902][109198] Num frames 31600... +[2023-09-14 12:08:11,163][109198] Num frames 31700... +[2023-09-14 12:08:11,440][109198] Num frames 31800... +[2023-09-14 12:08:11,668][109198] Num frames 31900... +[2023-09-14 12:08:11,931][109198] Num frames 32000... +[2023-09-14 12:08:12,190][109198] Num frames 32100... +[2023-09-14 12:08:12,434][109198] Num frames 32200... +[2023-09-14 12:08:12,691][109198] Num frames 32300... +[2023-09-14 12:08:12,953][109198] Num frames 32400... +[2023-09-14 12:08:13,224][109198] Num frames 32500... +[2023-09-14 12:08:13,486][109198] Num frames 32600... +[2023-09-14 12:08:13,743][109198] Num frames 32700... +[2023-09-14 12:08:14,014][109198] Num frames 32800... +[2023-09-14 12:08:14,307][109198] Num frames 32900... +[2023-09-14 12:08:14,577][109198] Num frames 33000... +[2023-09-14 12:08:14,861][109198] Num frames 33100... +[2023-09-14 12:08:15,109][109198] Num frames 33200... +[2023-09-14 12:08:15,385][109198] Num frames 33300... +[2023-09-14 12:08:15,635][109198] Num frames 33400... +[2023-09-14 12:08:15,897][109198] Num frames 33500... +[2023-09-14 12:08:16,129][109198] DAMAGECOUNT value on done: 375.0 +[2023-09-14 12:08:16,130][109198] DAMAGECOUNT value on done: 380.0 +[2023-09-14 12:08:16,132][109198] Sum rewards: 11.747, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.019', 'AMMO3': '0.020', 'AMMO4': '0.096', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'WEAPON4': '0.200', 'weapon5': '0.368', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.400', 'weapon2': '1.622', 'weapon4': '2.212', 'weapon3': '6.508'} +[2023-09-14 12:08:16,201][109198] Avg episode rewards: #0: 12.665, #1: 13.072, true rewards: #0: 0.250, #1: 0.500 +[2023-09-14 12:08:16,203][109198] Avg episode reward: 12.869, avg true_objective: 0.375 +[2023-09-14 12:08:16,225][109198] Num frames 33600... +[2023-09-14 12:08:16,500][109198] Num frames 33700... +[2023-09-14 12:08:16,778][109198] Num frames 33800... +[2023-09-14 12:08:17,044][109198] Num frames 33900... +[2023-09-14 12:08:17,311][109198] Num frames 34000... +[2023-09-14 12:08:17,589][109198] Num frames 34100... +[2023-09-14 12:08:17,846][109198] Num frames 34200... +[2023-09-14 12:08:18,115][109198] Num frames 34300... +[2023-09-14 12:08:18,424][109198] Num frames 34400... +[2023-09-14 12:08:18,685][109198] Num frames 34500... +[2023-09-14 12:08:18,949][109198] Num frames 34600... +[2023-09-14 12:08:19,229][109198] Num frames 34700... +[2023-09-14 12:08:19,508][109198] Num frames 34800... +[2023-09-14 12:08:19,747][109198] Num frames 34900... +[2023-09-14 12:08:19,988][109198] Num frames 35000... +[2023-09-14 12:08:20,244][109198] Num frames 35100... +[2023-09-14 12:08:20,513][109198] Num frames 35200... +[2023-09-14 12:08:20,805][109198] Num frames 35300... +[2023-09-14 12:08:21,049][109198] Num frames 35400... +[2023-09-14 12:08:21,298][109198] Num frames 35500... +[2023-09-14 12:08:21,534][109198] Num frames 35600... +[2023-09-14 12:08:21,797][109198] Num frames 35700... +[2023-09-14 12:08:22,057][109198] Num frames 35800... +[2023-09-14 12:08:22,308][109198] Num frames 35900... +[2023-09-14 12:08:22,560][109198] Num frames 36000... +[2023-09-14 12:08:22,813][109198] Num frames 36100... +[2023-09-14 12:08:23,085][109198] Num frames 36200... +[2023-09-14 12:08:23,358][109198] Num frames 36300... +[2023-09-14 12:08:23,630][109198] Num frames 36400... +[2023-09-14 12:08:23,874][109198] Num frames 36500... +[2023-09-14 12:08:24,115][109198] Num frames 36600... +[2023-09-14 12:08:24,408][109198] Num frames 36700... +[2023-09-14 12:08:24,682][109198] Num frames 36800... +[2023-09-14 12:08:24,949][109198] Num frames 36900... +[2023-09-14 12:08:25,198][109198] Num frames 37000... +[2023-09-14 12:08:25,473][109198] Num frames 37100... +[2023-09-14 12:08:25,730][109198] Num frames 37200... +[2023-09-14 12:08:25,993][109198] Num frames 37300... +[2023-09-14 12:08:26,266][109198] Num frames 37400... +[2023-09-14 12:08:26,545][109198] Num frames 37500... +[2023-09-14 12:08:26,806][109198] Num frames 37600... +[2023-09-14 12:08:27,077][109198] Num frames 37700... +[2023-09-14 12:08:27,320][109198] Num frames 37800... +[2023-09-14 12:08:27,580][109198] Num frames 37900... +[2023-09-14 12:08:27,816][109198] Num frames 38000... +[2023-09-14 12:08:28,073][109198] Num frames 38100... +[2023-09-14 12:08:28,373][109198] Num frames 38200... +[2023-09-14 12:08:28,626][109198] Num frames 38300... +[2023-09-14 12:08:28,863][109198] Num frames 38400... +[2023-09-14 12:08:29,121][109198] Num frames 38500... +[2023-09-14 12:08:29,382][109198] Num frames 38600... +[2023-09-14 12:08:29,639][109198] Num frames 38700... +[2023-09-14 12:08:29,891][109198] Num frames 38800... +[2023-09-14 12:08:30,150][109198] Num frames 38900... +[2023-09-14 12:08:30,403][109198] Num frames 39000... +[2023-09-14 12:08:30,652][109198] Num frames 39100... +[2023-09-14 12:08:30,939][109198] Num frames 39200... +[2023-09-14 12:08:31,260][109198] Num frames 39300... +[2023-09-14 12:08:31,516][109198] Num frames 39400... +[2023-09-14 12:08:31,783][109198] Num frames 39500... +[2023-09-14 12:08:32,026][109198] Num frames 39600... +[2023-09-14 12:08:32,315][109198] Num frames 39700... +[2023-09-14 12:08:32,552][109198] Num frames 39800... +[2023-09-14 12:08:32,812][109198] Num frames 39900... +[2023-09-14 12:08:33,048][109198] Num frames 40000... +[2023-09-14 12:08:33,303][109198] Num frames 40100... +[2023-09-14 12:08:33,566][109198] Num frames 40200... +[2023-09-14 12:08:33,839][109198] Num frames 40300... +[2023-09-14 12:08:34,116][109198] Num frames 40400... +[2023-09-14 12:08:34,434][109198] Num frames 40500... +[2023-09-14 12:08:34,718][109198] Num frames 40600... +[2023-09-14 12:08:34,951][109198] Num frames 40700... +[2023-09-14 12:08:35,194][109198] Num frames 40800... +[2023-09-14 12:08:35,479][109198] Num frames 40900... +[2023-09-14 12:08:35,727][109198] Num frames 41000... +[2023-09-14 12:08:35,997][109198] Num frames 41100... +[2023-09-14 12:08:36,269][109198] Num frames 41200... +[2023-09-14 12:08:36,543][109198] Num frames 41300... +[2023-09-14 12:08:36,798][109198] Num frames 41400... +[2023-09-14 12:08:37,080][109198] Num frames 41500... +[2023-09-14 12:08:37,339][109198] Num frames 41600... +[2023-09-14 12:08:37,657][109198] Num frames 41700... +[2023-09-14 12:08:37,882][109198] Num frames 41800... +[2023-09-14 12:08:38,157][109198] Num frames 41900... +[2023-09-14 12:08:38,425][109198] DAMAGECOUNT value on done: 490.0 +[2023-09-14 12:08:38,425][109198] DAMAGECOUNT value on done: 480.0 +[2023-09-14 12:08:38,426][109198] Sum rewards: 15.714, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'weapon5': '0.006', 'AMMO2': '0.023', 'AMMO3': '0.030', 'WEAPON5': '0.100', 'AMMO4': '0.114', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150', 'weapon2': '1.542', 'weapon4': '2.612', 'weapon3': '10.632'} +[2023-09-14 12:08:38,428][109198] Sum rewards: 13.388, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.027', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO3': '0.059', 'WEAPON5': '0.200', 'weapon5': '0.426', 'WEAPON3': '0.500', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon2': '2.324', 'weapon3': '11.904'} +[2023-09-14 12:08:38,490][109198] Avg episode rewards: #0: 13.274, #1: 13.135, true rewards: #0: 0.400, #1: 0.400 +[2023-09-14 12:08:38,492][109198] Avg episode reward: 13.205, avg true_objective: 0.400 +[2023-09-14 12:13:05,845][109198] Replay video saved to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/replay.mp4! +[2023-09-14 12:21:42,954][109198] The model has been pushed to https://huggingface.co/MattStammers/vizdoom_duel +[2023-09-14 12:27:49,655][109198] Environment doom_basic already registered, overwriting... +[2023-09-14 12:27:49,659][109198] Environment doom_two_colors_easy already registered, overwriting... +[2023-09-14 12:27:49,660][109198] Environment doom_two_colors_hard already registered, overwriting... +[2023-09-14 12:27:49,662][109198] Environment doom_dm already registered, overwriting... +[2023-09-14 12:27:49,663][109198] Environment doom_dwango5 already registered, overwriting... +[2023-09-14 12:27:49,665][109198] Environment doom_my_way_home_flat_actions already registered, overwriting... +[2023-09-14 12:27:49,666][109198] Environment doom_defend_the_center_flat_actions already registered, overwriting... +[2023-09-14 12:27:49,666][109198] Environment doom_my_way_home already registered, overwriting... +[2023-09-14 12:27:49,667][109198] Environment doom_deadly_corridor already registered, overwriting... +[2023-09-14 12:27:49,668][109198] Environment doom_defend_the_center already registered, overwriting... +[2023-09-14 12:27:49,669][109198] Environment doom_defend_the_line already registered, overwriting... +[2023-09-14 12:27:49,670][109198] Environment doom_health_gathering already registered, overwriting... +[2023-09-14 12:27:49,671][109198] Environment doom_health_gathering_supreme already registered, overwriting... +[2023-09-14 12:27:49,672][109198] Environment doom_battle already registered, overwriting... +[2023-09-14 12:27:49,673][109198] Environment doom_battle2 already registered, overwriting... +[2023-09-14 12:27:49,674][109198] Environment doom_duel_bots already registered, overwriting... +[2023-09-14 12:27:49,676][109198] Environment doom_deathmatch_bots already registered, overwriting... +[2023-09-14 12:27:49,677][109198] Environment doom_duel already registered, overwriting... +[2023-09-14 12:27:49,678][109198] Environment doom_deathmatch_full already registered, overwriting... +[2023-09-14 12:27:49,679][109198] Environment doom_benchmark already registered, overwriting... +[2023-09-14 12:27:49,681][109198] register_encoder_factory: +[2023-09-14 12:27:49,697][109198] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json +[2023-09-14 12:27:49,698][109198] Overriding arg 'train_for_env_steps' with value 10000000 passed from command line +[2023-09-14 12:27:49,703][109198] Experiment dir /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment already exists! +[2023-09-14 12:27:49,704][109198] Resuming existing experiment from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment... +[2023-09-14 12:27:49,705][109198] Weights and Biases integration disabled +[2023-09-14 12:27:49,707][109198] Environment var CUDA_VISIBLE_DEVICES is 0,1 + +[2023-09-14 12:27:51,691][109198] Starting experiment with the following configuration: +help=False +algo=APPO +env=doom_duel +experiment=default_experiment +train_dir=/home/cogstack/Documents/optuna/environments/sample_factory/train_dir +restart_behavior=resume +device=gpu +seed=None +num_policies=1 +async_rl=True +serial_mode=False +batched_sampling=False +num_batches_to_accumulate=2 +worker_num_splits=2 +policy_workers_per_policy=1 +max_policy_lag=1000 +num_workers=8 +num_envs_per_worker=4 +batch_size=1024 +num_batches_per_epoch=1 +num_epochs=1 +rollout=32 +recurrence=32 +shuffle_minibatches=False +gamma=0.99 +reward_scale=1.0 +reward_clip=1000.0 +value_bootstrap=False +normalize_returns=True +exploration_loss_coeff=0.001 +value_loss_coeff=0.5 +kl_loss_coeff=0.0 +exploration_loss=symmetric_kl +gae_lambda=0.95 +ppo_clip_ratio=0.1 +ppo_clip_value=0.2 +with_vtrace=False +vtrace_rho=1.0 +vtrace_c=1.0 +optimizer=adam +adam_eps=1e-06 +adam_beta1=0.9 +adam_beta2=0.999 +max_grad_norm=4.0 +learning_rate=0.0001 +lr_schedule=constant +lr_schedule_kl_threshold=0.008 +lr_adaptive_min=1e-06 +lr_adaptive_max=0.01 +obs_subtract_mean=0.0 +obs_scale=255.0 +normalize_input=True +normalize_input_keys=None +decorrelate_experience_max_seconds=0 +decorrelate_envs_on_one_worker=True +actor_worker_gpus=[] +set_workers_cpu_affinity=True +force_envs_single_thread=False +default_niceness=0 +log_to_file=True +experiment_summaries_interval=10 +flush_summaries_interval=30 +stats_avg=100 +summaries_use_frameskip=True +heartbeat_interval=20 +heartbeat_reporting_interval=600 +train_for_env_steps=10000000 +train_for_seconds=10000000000 +save_every_sec=120 +keep_checkpoints=2 +load_checkpoint_kind=latest +save_milestones_sec=-1 +save_best_every_sec=5 +save_best_metric=reward +save_best_after=100000 +benchmark=False +encoder_mlp_layers=[512, 512] +encoder_conv_architecture=convnet_simple +encoder_conv_mlp_layers=[512] +use_rnn=True +rnn_size=512 +rnn_type=gru +rnn_num_layers=1 +decoder_mlp_layers=[] +nonlinearity=elu +policy_initialization=orthogonal +policy_init_gain=1.0 +actor_critic_share_weights=True +adaptive_stddev=True +continuous_tanh_scale=0.0 +initial_stddev=1.0 +use_env_info_cache=False +env_gpu_actions=False +env_gpu_observations=True +env_frameskip=4 +env_framestack=1 +pixel_format=CHW +use_record_episode_statistics=False +with_wandb=False +wandb_user=None +wandb_project=sample_factory +wandb_group=None +wandb_job_type=SF +wandb_tags=[] +with_pbt=False +pbt_mix_policies_in_one_env=True +pbt_period_env_steps=5000000 +pbt_start_mutation=20000000 +pbt_replace_fraction=0.3 +pbt_mutation_rate=0.15 +pbt_replace_reward_gap=0.1 +pbt_replace_reward_gap_absolute=1e-06 +pbt_optimize_gamma=False +pbt_target_objective=true_objective +pbt_perturb_min=1.1 +pbt_perturb_max=1.5 +num_agents=-1 +num_humans=0 +num_bots=-1 +start_bot_difficulty=None +timelimit=None +res_w=128 +res_h=72 +wide_aspect_ratio=False +eval_env_frameskip=1 +fps=35 +command_line=--env=doom_dm --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=20000000 +cli_args={'env': 'doom_dm', 'num_workers': 8, 'num_envs_per_worker': 4, 'train_for_env_steps': 20000000} +git_hash=20b6d44612dad7d171f23e13b1f3b4c5e5631cf9 +git_repo_name=https://github.com/MattStammers/optuna.git +[2023-09-14 12:27:51,693][109198] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json... +[2023-09-14 12:27:51,811][109198] Rollout worker 0 uses device cpu +[2023-09-14 12:27:51,812][109198] Rollout worker 1 uses device cpu +[2023-09-14 12:27:51,813][109198] Rollout worker 2 uses device cpu +[2023-09-14 12:27:51,814][109198] Rollout worker 3 uses device cpu +[2023-09-14 12:27:51,815][109198] Rollout worker 4 uses device cpu +[2023-09-14 12:27:51,816][109198] Rollout worker 5 uses device cpu +[2023-09-14 12:27:51,817][109198] Rollout worker 6 uses device cpu +[2023-09-14 12:27:51,818][109198] Rollout worker 7 uses device cpu +[2023-09-14 12:27:51,888][109198] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:27:51,891][109198] InferenceWorker_p0-w0: min num requests: 2 +[2023-09-14 12:27:51,918][109198] Starting all processes... +[2023-09-14 12:27:51,919][109198] Starting process learner_proc0 +[2023-09-14 12:27:53,479][109198] Starting all processes... +[2023-09-14 12:27:53,481][44016] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:27:53,481][44016] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 +[2023-09-14 12:27:53,484][109198] Starting process inference_proc0-0 +[2023-09-14 12:27:53,485][109198] Starting process rollout_proc0 +[2023-09-14 12:27:53,486][109198] Starting process rollout_proc1 +[2023-09-14 12:27:53,486][109198] Starting process rollout_proc2 +[2023-09-14 12:27:53,517][44016] Num visible devices: 1 +[2023-09-14 12:27:53,563][44016] Starting seed is not provided +[2023-09-14 12:27:53,564][44016] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:27:53,564][44016] Initializing actor-critic model on device cuda:0 +[2023-09-14 12:27:53,564][44016] RunningMeanStd input shape: (23,) +[2023-09-14 12:27:53,564][44016] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:27:53,487][109198] Starting process rollout_proc3 +[2023-09-14 12:27:53,565][44016] RunningMeanStd input shape: (1,) +[2023-09-14 12:27:53,487][109198] Starting process rollout_proc4 +[2023-09-14 12:27:53,488][109198] Starting process rollout_proc5 +[2023-09-14 12:27:53,580][44016] ConvEncoder: input_channels=3 +[2023-09-14 12:27:53,488][109198] Starting process rollout_proc6 +[2023-09-14 12:27:53,491][109198] Starting process rollout_proc7 +[2023-09-14 12:27:53,787][44016] Conv encoder output size: 512 +[2023-09-14 12:27:53,788][44016] Policy head output size: 640 +[2023-09-14 12:27:53,819][44016] Created Actor Critic model with architecture: +[2023-09-14 12:27:53,819][44016] ActorCriticSharedWeights( + (obs_normalizer): ObservationNormalizer( + (running_mean_std): RunningMeanStdDictInPlace( + (running_mean_std): ModuleDict( + (measurements): RunningMeanStdInPlace() + (obs): RunningMeanStdInPlace() + ) + ) + ) + (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) + (encoder): VizdoomEncoder( + (basic_encoder): ConvEncoder( + (enc): RecursiveScriptModule( + original_name=ConvEncoderImpl + (conv_head): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Conv2d) + (1): RecursiveScriptModule(original_name=ELU) + (2): RecursiveScriptModule(original_name=Conv2d) + (3): RecursiveScriptModule(original_name=ELU) + (4): RecursiveScriptModule(original_name=Conv2d) + (5): RecursiveScriptModule(original_name=ELU) + ) + (mlp_layers): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Linear) + (1): RecursiveScriptModule(original_name=ELU) + ) + ) + ) + (measurements_head): Sequential( + (0): Linear(in_features=23, out_features=128, bias=True) + (1): ELU(alpha=1.0) + (2): Linear(in_features=128, out_features=128, bias=True) + (3): ELU(alpha=1.0) + ) + ) + (core): ModelCoreRNN( + (core): GRU(640, 512) + ) + (decoder): MlpDecoder( + (mlp): Identity() + ) + (critic_linear): Linear(in_features=512, out_features=1, bias=True) + (action_parameterization): ActionParameterizationDefault( + (distribution_linear): Linear(in_features=512, out_features=41, bias=True) + ) +) +[2023-09-14 12:27:55,107][44016] Using optimizer +[2023-09-14 12:27:55,107][44016] Loading state from checkpoint /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000248_1015808.pth... +[2023-09-14 12:27:55,135][44016] Loading model from checkpoint +[2023-09-14 12:27:55,140][44016] Loaded experiment state at self.train_step=248, self.env_steps=1015808 +[2023-09-14 12:27:55,141][44016] Initialized policy 0 weights for model version 248 +[2023-09-14 12:27:55,142][44016] LearnerWorker_p0 finished initialization! +[2023-09-14 12:27:55,143][44016] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:27:55,475][44090] Worker 0 uses CPU cores [0, 1, 2, 3] +[2023-09-14 12:27:55,564][44091] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:27:55,564][44091] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 +[2023-09-14 12:27:55,569][44125] Worker 2 uses CPU cores [8, 9, 10, 11] +[2023-09-14 12:27:55,575][44159] Worker 3 uses CPU cores [12, 13, 14, 15] +[2023-09-14 12:27:55,585][44091] Num visible devices: 1 +[2023-09-14 12:27:55,715][44160] Worker 4 uses CPU cores [16, 17, 18, 19] +[2023-09-14 12:27:55,789][44123] Worker 1 uses CPU cores [4, 5, 6, 7] +[2023-09-14 12:27:55,848][44162] Worker 7 uses CPU cores [28, 29, 30, 31] +[2023-09-14 12:27:55,938][44161] Worker 6 uses CPU cores [24, 25, 26, 27] +[2023-09-14 12:27:56,110][44158] Worker 5 uses CPU cores [20, 21, 22, 23] +[2023-09-14 12:27:56,111][109198] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 1015808. Throughput: 0: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 12:27:56,218][44091] RunningMeanStd input shape: (23,) +[2023-09-14 12:27:56,218][44091] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:27:56,218][44091] RunningMeanStd input shape: (1,) +[2023-09-14 12:27:56,230][44091] ConvEncoder: input_channels=3 +[2023-09-14 12:27:56,333][44091] Conv encoder output size: 512 +[2023-09-14 12:27:56,334][44091] Policy head output size: 640 +[2023-09-14 12:27:56,613][109198] Inference worker 0-0 is ready! +[2023-09-14 12:27:56,615][109198] All inference workers are ready! Signal rollout workers to start! +[2023-09-14 12:27:56,619][44162] Multi agent env, num agents: 2 +[2023-09-14 12:27:56,621][44161] Multi agent env, num agents: 2 +[2023-09-14 12:27:56,621][44125] Multi agent env, num agents: 2 +[2023-09-14 12:27:56,621][44159] Multi agent env, num agents: 2 +[2023-09-14 12:27:56,623][44158] Multi agent env, num agents: 2 +[2023-09-14 12:27:56,623][44123] Multi agent env, num agents: 2 +[2023-09-14 12:27:56,623][44090] Multi agent env, num agents: 2 +[2023-09-14 12:27:56,623][44160] Multi agent env, num agents: 2 +[2023-09-14 12:27:56,650][44162] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:27:56,653][44162] Multi agent env, num agents: 2 +[2023-09-14 12:27:56,654][44159] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:27:56,657][44159] Multi agent env, num agents: 2 +[2023-09-14 12:27:56,671][44161] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:27:56,671][44125] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:27:56,673][44160] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:27:56,673][44090] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:27:56,673][44158] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:27:56,673][44123] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:27:56,676][44161] Multi agent env, num agents: 2 +[2023-09-14 12:27:56,676][44125] Multi agent env, num agents: 2 +[2023-09-14 12:27:56,677][44090] Multi agent env, num agents: 2 +[2023-09-14 12:27:56,677][44160] Multi agent env, num agents: 2 +[2023-09-14 12:27:56,678][44123] Multi agent env, num agents: 2 +[2023-09-14 12:27:56,678][44158] Multi agent env, num agents: 2 +[2023-09-14 12:27:56,682][44162] UDP port 41000 cannot be used [Errno 98] Address already in use +[2023-09-14 12:27:56,683][44162] Port 42000 is available +[2023-09-14 12:27:56,683][44162] Using port 42000 +[2023-09-14 12:27:56,684][44162] Initializing env for player 0, init_info: {'port': 42000}... +[2023-09-14 12:27:56,687][44159] Port 40600 is available +[2023-09-14 12:27:56,687][44159] Using port 40600 +[2023-09-14 12:27:56,688][44159] Initializing env for player 0, init_info: {'port': 40600}... +[2023-09-14 12:27:56,713][44162] Using port 42000 on host... +[2023-09-14 12:27:56,721][44159] Using port 40600 on host... +[2023-09-14 12:27:56,725][44125] Port 40500 is available +[2023-09-14 12:27:56,725][44161] Port 40900 is available +[2023-09-14 12:27:56,725][44125] Using port 40500 +[2023-09-14 12:27:56,725][44161] Using port 40900 +[2023-09-14 12:27:56,726][44090] Port 40300 is available +[2023-09-14 12:27:56,726][44125] Initializing env for player 0, init_info: {'port': 40500}... +[2023-09-14 12:27:56,726][44161] Initializing env for player 0, init_info: {'port': 40900}... +[2023-09-14 12:27:56,726][44090] Using port 40300 +[2023-09-14 12:27:56,727][44160] Port 40700 is available +[2023-09-14 12:27:56,727][44090] Initializing env for player 0, init_info: {'port': 40300}... +[2023-09-14 12:27:56,727][44160] Using port 40700 +[2023-09-14 12:27:56,728][44160] Initializing env for player 0, init_info: {'port': 40700}... +[2023-09-14 12:27:56,730][44158] Port 40800 is available +[2023-09-14 12:27:56,730][44158] Using port 40800 +[2023-09-14 12:27:56,730][44123] Port 40400 is available +[2023-09-14 12:27:56,730][44123] Using port 40400 +[2023-09-14 12:27:56,731][44158] Initializing env for player 0, init_info: {'port': 40800}... +[2023-09-14 12:27:56,731][44123] Initializing env for player 0, init_info: {'port': 40400}... +[2023-09-14 12:27:56,735][44162] Initializing env for player 1, init_info: {'port': 42000}... +[2023-09-14 12:27:56,739][44159] Initializing env for player 1, init_info: {'port': 40600}... +[2023-09-14 12:27:56,760][44123] Using port 40400 on host... +[2023-09-14 12:27:56,761][44161] Using port 40900 on host... +[2023-09-14 12:27:56,761][44125] Using port 40500 on host... +[2023-09-14 12:27:56,761][44158] Using port 40800 on host... +[2023-09-14 12:27:56,775][44090] Using port 40300 on host... +[2023-09-14 12:27:56,776][44160] Using port 40700 on host... +[2023-09-14 12:27:56,776][44161] Initializing env for player 1, init_info: {'port': 40900}... +[2023-09-14 12:27:56,777][44125] Initializing env for player 1, init_info: {'port': 40500}... +[2023-09-14 12:27:56,781][44158] Initializing env for player 1, init_info: {'port': 40800}... +[2023-09-14 12:27:56,781][44123] Initializing env for player 1, init_info: {'port': 40400}... +[2023-09-14 12:27:56,782][44160] Initializing env for player 1, init_info: {'port': 40700}... +[2023-09-14 12:27:56,782][44090] Initializing env for player 1, init_info: {'port': 40300}... +[2023-09-14 12:27:57,880][44159] Initialized w:3 v:0 player:1 +[2023-09-14 12:27:57,880][44159] Initialized w:3 v:0 player:0 +[2023-09-14 12:27:57,880][44162] Initialized w:7 v:0 player:1 +[2023-09-14 12:27:57,881][44162] Initialized w:7 v:0 player:0 +[2023-09-14 12:27:57,881][44090] Initialized w:0 v:0 player:1 +[2023-09-14 12:27:57,882][44159] 2 agent workers initialized for env 3! +[2023-09-14 12:27:57,881][44090] Initialized w:0 v:0 player:0 +[2023-09-14 12:27:57,882][44162] 2 agent workers initialized for env 7! +[2023-09-14 12:27:57,883][44090] 2 agent workers initialized for env 0! +[2023-09-14 12:27:57,891][44159] Decorrelating experience for 0 frames... +[2023-09-14 12:27:57,892][44162] Decorrelating experience for 0 frames... +[2023-09-14 12:27:57,892][44159] Port 40601 is available +[2023-09-14 12:27:57,892][44159] Using port 40601 +[2023-09-14 12:27:57,893][44162] UDP port 41001 cannot be used [Errno 98] Address already in use +[2023-09-14 12:27:57,893][44162] Port 42001 is available +[2023-09-14 12:27:57,893][44162] Using port 42001 +[2023-09-14 12:27:57,894][44090] Decorrelating experience for 0 frames... +[2023-09-14 12:27:57,894][44125] Initialized w:2 v:0 player:0 +[2023-09-14 12:27:57,895][44090] Port 40301 is available +[2023-09-14 12:27:57,895][44090] Using port 40301 +[2023-09-14 12:27:57,895][44125] Initialized w:2 v:0 player:1 +[2023-09-14 12:27:57,896][44090] Initializing env for player 0, init_info: {'port': 40301}... +[2023-09-14 12:27:57,897][44125] 2 agent workers initialized for env 2! +[2023-09-14 12:27:57,906][44125] Decorrelating experience for 0 frames... +[2023-09-14 12:27:57,907][44125] Port 40501 is available +[2023-09-14 12:27:57,908][44125] Using port 40501 +[2023-09-14 12:27:57,909][44125] Initializing env for player 0, init_info: {'port': 40501}... +[2023-09-14 12:27:57,924][44161] Initialized w:6 v:0 player:0 +[2023-09-14 12:27:57,925][44161] Initialized w:6 v:0 player:1 +[2023-09-14 12:27:57,925][44158] Initialized w:5 v:0 player:0 +[2023-09-14 12:27:57,925][44160] Initialized w:4 v:0 player:1 +[2023-09-14 12:27:57,926][44158] Initialized w:5 v:0 player:1 +[2023-09-14 12:27:57,926][44160] Initialized w:4 v:0 player:0 +[2023-09-14 12:27:57,926][44161] 2 agent workers initialized for env 6! +[2023-09-14 12:27:57,927][44158] 2 agent workers initialized for env 5! +[2023-09-14 12:27:57,927][44090] Using port 40301 on host... +[2023-09-14 12:27:57,927][44160] 2 agent workers initialized for env 4! +[2023-09-14 12:27:57,937][44160] Decorrelating experience for 0 frames... +[2023-09-14 12:27:57,937][44161] Decorrelating experience for 0 frames... +[2023-09-14 12:27:57,937][44158] Decorrelating experience for 0 frames... +[2023-09-14 12:27:57,938][44160] Port 40701 is available +[2023-09-14 12:27:57,938][44160] Using port 40701 +[2023-09-14 12:27:57,938][44158] Port 40801 is available +[2023-09-14 12:27:57,938][44158] Using port 40801 +[2023-09-14 12:27:57,938][44160] Initializing env for player 0, init_info: {'port': 40701}... +[2023-09-14 12:27:57,938][44161] Port 40901 is available +[2023-09-14 12:27:57,939][44161] Using port 40901 +[2023-09-14 12:27:57,939][44158] Initializing env for player 0, init_info: {'port': 40801}... +[2023-09-14 12:27:57,939][44161] Initializing env for player 0, init_info: {'port': 40901}... +[2023-09-14 12:27:57,944][44159] Initializing env for player 0, init_info: {'port': 40601}... +[2023-09-14 12:27:57,946][44125] Using port 40501 on host... +[2023-09-14 12:27:57,947][44090] Initializing env for player 1, init_info: {'port': 40301}... +[2023-09-14 12:27:57,950][44123] Initialized w:1 v:0 player:1 +[2023-09-14 12:27:57,950][44123] Initialized w:1 v:0 player:0 +[2023-09-14 12:27:57,952][44123] 2 agent workers initialized for env 1! +[2023-09-14 12:27:57,959][44125] Initializing env for player 1, init_info: {'port': 40501}... +[2023-09-14 12:27:57,962][44123] Decorrelating experience for 0 frames... +[2023-09-14 12:27:57,963][44123] Port 40401 is available +[2023-09-14 12:27:57,963][44123] Using port 40401 +[2023-09-14 12:27:57,968][44160] Using port 40701 on host... +[2023-09-14 12:27:57,971][44158] Using port 40801 on host... +[2023-09-14 12:27:57,979][44159] Using port 40601 on host... +[2023-09-14 12:27:57,980][44161] Using port 40901 on host... +[2023-09-14 12:27:57,989][44160] Initializing env for player 1, init_info: {'port': 40701}... +[2023-09-14 12:27:57,990][44161] Initializing env for player 1, init_info: {'port': 40901}... +[2023-09-14 12:27:57,991][44158] Initializing env for player 1, init_info: {'port': 40801}... +[2023-09-14 12:27:57,994][44159] Initializing env for player 1, init_info: {'port': 40601}... +[2023-09-14 12:27:58,988][44090] Initialized w:0 v:1 player:1 +[2023-09-14 12:27:58,989][44090] Initialized w:0 v:1 player:0 +[2023-09-14 12:27:58,991][44090] 2 agent workers initialized for env 0! +[2023-09-14 12:27:58,998][44090] Decorrelating experience for 32 frames... +[2023-09-14 12:27:59,058][44090] Multi agent env, num agents: 2 +[2023-09-14 12:27:59,069][44159] Initialized w:3 v:1 player:0 +[2023-09-14 12:27:59,070][44161] Initialized w:6 v:1 player:1 +[2023-09-14 12:27:59,069][44159] Initialized w:3 v:1 player:1 +[2023-09-14 12:27:59,072][44158] Initialized w:5 v:1 player:0 +[2023-09-14 12:27:59,073][44159] 2 agent workers initialized for env 3! +[2023-09-14 12:27:59,073][44158] Initialized w:5 v:1 player:1 +[2023-09-14 12:27:59,074][44158] 2 agent workers initialized for env 5! +[2023-09-14 12:27:59,083][44159] Decorrelating experience for 32 frames... +[2023-09-14 12:27:59,084][44158] Decorrelating experience for 32 frames... +[2023-09-14 12:27:59,097][44090] Multi agent env, num agents: 2 +[2023-09-14 12:27:59,106][44162] Initializing env for player 0, init_info: {'port': 42001}... +[2023-09-14 12:27:59,127][44090] Port 40302 is available +[2023-09-14 12:27:59,127][44090] Using port 40302 +[2023-09-14 12:27:59,128][44090] Initializing env for player 0, init_info: {'port': 40302}... +[2023-09-14 12:27:59,136][44125] Initialized w:2 v:1 player:1 +[2023-09-14 12:27:59,143][44162] Using port 42001 on host... +[2023-09-14 12:27:59,146][44125] Initialized w:2 v:1 player:0 +[2023-09-14 12:27:59,147][44125] 2 agent workers initialized for env 2! +[2023-09-14 12:27:59,156][44162] Initializing env for player 1, init_info: {'port': 42001}... +[2023-09-14 12:27:59,158][44125] Decorrelating experience for 32 frames... +[2023-09-14 12:27:59,167][44158] Multi agent env, num agents: 2 +[2023-09-14 12:27:59,172][44090] Using port 40302 on host... +[2023-09-14 12:27:59,174][44160] Initialized w:4 v:1 player:1 +[2023-09-14 12:27:59,174][44160] Initialized w:4 v:1 player:0 +[2023-09-14 12:27:59,175][44160] 2 agent workers initialized for env 4! +[2023-09-14 12:27:59,178][44123] Initializing env for player 0, init_info: {'port': 40401}... +[2023-09-14 12:27:59,178][44090] Initializing env for player 1, init_info: {'port': 40302}... +[2023-09-14 12:27:59,183][44159] Multi agent env, num agents: 2 +[2023-09-14 12:27:59,184][44160] Decorrelating experience for 32 frames... +[2023-09-14 12:27:59,213][44158] Multi agent env, num agents: 2 +[2023-09-14 12:27:59,224][44123] Using port 40401 on host... +[2023-09-14 12:27:59,229][44159] Multi agent env, num agents: 2 +[2023-09-14 12:27:59,232][44123] Initializing env for player 1, init_info: {'port': 40401}... +[2023-09-14 12:27:59,237][44125] Multi agent env, num agents: 2 +[2023-09-14 12:27:59,259][44158] Port 40802 is available +[2023-09-14 12:27:59,259][44158] Using port 40802 +[2023-09-14 12:27:59,259][44158] Initializing env for player 0, init_info: {'port': 40802}... +[2023-09-14 12:27:59,263][44160] Multi agent env, num agents: 2 +[2023-09-14 12:27:59,275][44159] Port 40602 is available +[2023-09-14 12:27:59,275][44159] Using port 40602 +[2023-09-14 12:27:59,275][44159] Initializing env for player 0, init_info: {'port': 40602}... +[2023-09-14 12:27:59,284][44125] Multi agent env, num agents: 2 +[2023-09-14 12:27:59,304][44158] Using port 40802 on host... +[2023-09-14 12:27:59,309][44160] Multi agent env, num agents: 2 +[2023-09-14 12:27:59,312][44158] Initializing env for player 1, init_info: {'port': 40802}... +[2023-09-14 12:27:59,320][44159] Using port 40602 on host... +[2023-09-14 12:27:59,328][44159] Initializing env for player 1, init_info: {'port': 40602}... +[2023-09-14 12:27:59,329][44125] Port 40502 is available +[2023-09-14 12:27:59,329][44125] Using port 40502 +[2023-09-14 12:27:59,330][44125] Initializing env for player 0, init_info: {'port': 40502}... +[2023-09-14 12:27:59,355][44160] Port 40702 is available +[2023-09-14 12:27:59,355][44160] Using port 40702 +[2023-09-14 12:27:59,365][44125] Using port 40502 on host... +[2023-09-14 12:27:59,380][44125] Initializing env for player 1, init_info: {'port': 40502}... +[2023-09-14 12:27:59,707][109198] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 1015808. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 12:28:00,069][44161] Initialized w:6 v:1 player:0 +[2023-09-14 12:28:00,070][44161] 2 agent workers initialized for env 6! +[2023-09-14 12:28:00,085][44161] Decorrelating experience for 32 frames... +[2023-09-14 12:28:00,151][44161] Multi agent env, num agents: 2 +[2023-09-14 12:28:00,181][44161] Multi agent env, num agents: 2 +[2023-09-14 12:28:00,209][44161] Port 40902 is available +[2023-09-14 12:28:00,209][44161] Using port 40902 +[2023-09-14 12:28:00,210][44161] Initializing env for player 0, init_info: {'port': 40902}... +[2023-09-14 12:28:00,244][44161] Using port 40902 on host... +[2023-09-14 12:28:00,245][44090] Initialized w:0 v:2 player:0 +[2023-09-14 12:28:00,245][44090] Initialized w:0 v:2 player:1 +[2023-09-14 12:28:00,247][44090] 2 agent workers initialized for env 0! +[2023-09-14 12:28:00,252][44162] Initialized w:7 v:1 player:0 +[2023-09-14 12:28:00,253][44162] Initialized w:7 v:1 player:1 +[2023-09-14 12:28:00,254][44162] 2 agent workers initialized for env 7! +[2023-09-14 12:28:00,256][44090] Decorrelating experience for 64 frames... +[2023-09-14 12:28:00,260][44161] Initializing env for player 1, init_info: {'port': 40902}... +[2023-09-14 12:28:00,267][44162] Decorrelating experience for 32 frames... +[2023-09-14 12:28:00,333][44162] Multi agent env, num agents: 2 +[2023-09-14 12:28:00,362][44162] Multi agent env, num agents: 2 +[2023-09-14 12:28:00,367][44090] Port 40303 is available +[2023-09-14 12:28:00,367][44090] Using port 40303 +[2023-09-14 12:28:00,390][44162] UDP port 41002 cannot be used [Errno 98] Address already in use +[2023-09-14 12:28:00,390][44162] Port 42002 is available +[2023-09-14 12:28:00,390][44162] Using port 42002 +[2023-09-14 12:28:00,391][44162] Initializing env for player 0, init_info: {'port': 42002}... +[2023-09-14 12:28:00,410][44123] Initialized w:1 v:1 player:1 +[2023-09-14 12:28:00,411][44123] Initialized w:1 v:1 player:0 +[2023-09-14 12:28:00,412][44123] 2 agent workers initialized for env 1! +[2023-09-14 12:28:00,417][44158] Initialized w:5 v:2 player:1 +[2023-09-14 12:28:00,418][44158] Initialized w:5 v:2 player:0 +[2023-09-14 12:28:00,418][44090] Initializing env for player 0, init_info: {'port': 40303}... +[2023-09-14 12:28:00,420][44158] 2 agent workers initialized for env 5! +[2023-09-14 12:28:00,426][44162] Using port 42002 on host... +[2023-09-14 12:28:00,428][44123] Decorrelating experience for 32 frames... +[2023-09-14 12:28:00,431][44158] Decorrelating experience for 64 frames... +[2023-09-14 12:28:00,432][44125] Initialized w:2 v:2 player:1 +[2023-09-14 12:28:00,433][44125] Initialized w:2 v:2 player:0 +[2023-09-14 12:28:00,435][44125] 2 agent workers initialized for env 2! +[2023-09-14 12:28:00,441][44162] Initializing env for player 1, init_info: {'port': 42002}... +[2023-09-14 12:28:00,445][44125] Decorrelating experience for 64 frames... +[2023-09-14 12:28:00,454][44090] Using port 40303 on host... +[2023-09-14 12:28:00,467][44160] Initializing env for player 0, init_info: {'port': 40702}... +[2023-09-14 12:28:00,471][44090] Initializing env for player 1, init_info: {'port': 40303}... +[2023-09-14 12:28:00,509][44123] Multi agent env, num agents: 2 +[2023-09-14 12:28:00,514][44159] Initialized w:3 v:2 player:0 +[2023-09-14 12:28:00,515][44159] Initialized w:3 v:2 player:1 +[2023-09-14 12:28:00,516][44160] Using port 40702 on host... +[2023-09-14 12:28:00,516][44159] 2 agent workers initialized for env 3! +[2023-09-14 12:28:00,526][44160] Initializing env for player 1, init_info: {'port': 40702}... +[2023-09-14 12:28:00,527][44159] Decorrelating experience for 64 frames... +[2023-09-14 12:28:00,546][44123] Multi agent env, num agents: 2 +[2023-09-14 12:28:00,583][44123] Port 40402 is available +[2023-09-14 12:28:00,583][44123] Using port 40402 +[2023-09-14 12:28:00,584][44123] Initializing env for player 0, init_info: {'port': 40402}... +[2023-09-14 12:28:00,587][44125] Port 40503 is available +[2023-09-14 12:28:00,587][44125] Using port 40503 +[2023-09-14 12:28:00,587][44125] Initializing env for player 0, init_info: {'port': 40503}... +[2023-09-14 12:28:00,589][44158] Port 40803 is available +[2023-09-14 12:28:00,589][44158] Using port 40803 +[2023-09-14 12:28:00,590][44158] Initializing env for player 0, init_info: {'port': 40803}... +[2023-09-14 12:28:00,612][44123] Using port 40402 on host... +[2023-09-14 12:28:00,616][44125] Using port 40503 on host... +[2023-09-14 12:28:00,618][44158] Using port 40803 on host... +[2023-09-14 12:28:00,634][44123] Initializing env for player 1, init_info: {'port': 40402}... +[2023-09-14 12:28:00,638][44125] Initializing env for player 1, init_info: {'port': 40503}... +[2023-09-14 12:28:00,640][44158] Initializing env for player 1, init_info: {'port': 40803}... +[2023-09-14 12:28:00,678][44159] Port 40603 is available +[2023-09-14 12:28:00,678][44159] Using port 40603 +[2023-09-14 12:28:00,679][44159] Initializing env for player 0, init_info: {'port': 40603}... +[2023-09-14 12:28:00,708][44159] Using port 40603 on host... +[2023-09-14 12:28:00,729][44159] Initializing env for player 1, init_info: {'port': 40603}... +[2023-09-14 12:28:01,308][44161] Initialized w:6 v:2 player:1 +[2023-09-14 12:28:01,308][44161] Initialized w:6 v:2 player:0 +[2023-09-14 12:28:01,310][44161] 2 agent workers initialized for env 6! +[2023-09-14 12:28:01,319][44161] Decorrelating experience for 64 frames... +[2023-09-14 12:28:01,459][44161] Port 40903 is available +[2023-09-14 12:28:01,460][44161] Using port 40903 +[2023-09-14 12:28:01,556][44162] Initialized w:7 v:2 player:0 +[2023-09-14 12:28:01,556][44162] Initialized w:7 v:2 player:1 +[2023-09-14 12:28:01,558][44162] 2 agent workers initialized for env 7! +[2023-09-14 12:28:01,573][44162] Decorrelating experience for 64 frames... +[2023-09-14 12:28:01,636][44160] Initialized w:4 v:2 player:0 +[2023-09-14 12:28:01,637][44160] Initialized w:4 v:2 player:1 +[2023-09-14 12:28:01,638][44160] 2 agent workers initialized for env 4! +[2023-09-14 12:28:01,651][44160] Decorrelating experience for 64 frames... +[2023-09-14 12:28:01,656][44090] Initialized w:0 v:3 player:0 +[2023-09-14 12:28:01,657][44090] Initialized w:0 v:3 player:1 +[2023-09-14 12:28:01,658][44090] 2 agent workers initialized for env 0! +[2023-09-14 12:28:01,666][44090] Decorrelating experience for 96 frames... +[2023-09-14 12:28:01,691][44162] Port 41003 is available +[2023-09-14 12:28:01,691][44162] Using port 41003 +[2023-09-14 12:28:01,691][44162] Initializing env for player 0, init_info: {'port': 41003}... +[2023-09-14 12:28:01,724][44162] Using port 41003 on host... +[2023-09-14 12:28:01,742][44162] Initializing env for player 1, init_info: {'port': 41003}... +[2023-09-14 12:28:01,771][44125] Initialized w:2 v:3 player:0 +[2023-09-14 12:28:01,772][44125] Initialized w:2 v:3 player:1 +[2023-09-14 12:28:01,773][44125] 2 agent workers initialized for env 2! +[2023-09-14 12:28:01,785][44125] Decorrelating experience for 96 frames... +[2023-09-14 12:28:01,788][44158] Initialized w:5 v:3 player:1 +[2023-09-14 12:28:01,790][44158] Initialized w:5 v:3 player:0 +[2023-09-14 12:28:01,790][44158] 2 agent workers initialized for env 5! +[2023-09-14 12:28:01,800][44158] Decorrelating experience for 96 frames... +[2023-09-14 12:28:01,803][44160] Port 40703 is available +[2023-09-14 12:28:01,804][44160] Using port 40703 +[2023-09-14 12:28:01,804][44160] Initializing env for player 0, init_info: {'port': 40703}... +[2023-09-14 12:28:01,813][44123] Initialized w:1 v:2 player:0 +[2023-09-14 12:28:01,813][44123] Initialized w:1 v:2 player:1 +[2023-09-14 12:28:01,814][44123] 2 agent workers initialized for env 1! +[2023-09-14 12:28:01,821][44161] Initializing env for player 0, init_info: {'port': 40903}... +[2023-09-14 12:28:01,823][44123] Decorrelating experience for 64 frames... +[2023-09-14 12:28:01,842][44160] Using port 40703 on host... +[2023-09-14 12:28:01,855][44160] Initializing env for player 1, init_info: {'port': 40703}... +[2023-09-14 12:28:01,857][44161] Using port 40903 on host... +[2023-09-14 12:28:01,871][44161] Initializing env for player 1, init_info: {'port': 40903}... +[2023-09-14 12:28:01,899][44159] Initialized w:3 v:3 player:0 +[2023-09-14 12:28:01,899][44159] Initialized w:3 v:3 player:1 +[2023-09-14 12:28:01,901][44159] 2 agent workers initialized for env 3! +[2023-09-14 12:28:01,911][44159] Decorrelating experience for 96 frames... +[2023-09-14 12:28:01,978][44123] Port 40403 is available +[2023-09-14 12:28:01,979][44123] Using port 40403 +[2023-09-14 12:28:01,980][44123] Initializing env for player 0, init_info: {'port': 40403}... +[2023-09-14 12:28:02,016][44123] Using port 40403 on host... +[2023-09-14 12:28:02,030][44123] Initializing env for player 1, init_info: {'port': 40403}... +[2023-09-14 12:28:02,840][44162] Initialized w:7 v:3 player:1 +[2023-09-14 12:28:02,840][44162] Initialized w:7 v:3 player:0 +[2023-09-14 12:28:02,841][44162] 2 agent workers initialized for env 7! +[2023-09-14 12:28:02,850][44162] Decorrelating experience for 96 frames... +[2023-09-14 12:28:02,902][44160] Initialized w:4 v:3 player:0 +[2023-09-14 12:28:02,903][44160] Initialized w:4 v:3 player:1 +[2023-09-14 12:28:02,904][44160] 2 agent workers initialized for env 4! +[2023-09-14 12:28:02,914][44160] Decorrelating experience for 96 frames... +[2023-09-14 12:28:02,918][44161] Initialized w:6 v:3 player:0 +[2023-09-14 12:28:02,919][44161] Initialized w:6 v:3 player:1 +[2023-09-14 12:28:02,920][44161] 2 agent workers initialized for env 6! +[2023-09-14 12:28:02,930][44161] Decorrelating experience for 96 frames... +[2023-09-14 12:28:03,143][44123] Initialized w:1 v:3 player:0 +[2023-09-14 12:28:03,143][44123] Initialized w:1 v:3 player:1 +[2023-09-14 12:28:03,144][44123] 2 agent workers initialized for env 1! +[2023-09-14 12:28:03,154][44123] Decorrelating experience for 96 frames... +[2023-09-14 12:28:03,164][44016] Signal inference workers to stop experience collection... +[2023-09-14 12:28:03,173][44091] InferenceWorker_p0-w0: stopping experience collection +[2023-09-14 12:28:04,707][109198] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 1015808. Throughput: 0: 100.0. Samples: 860. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 12:28:06,281][44016] Signal inference workers to resume experience collection... +[2023-09-14 12:28:06,282][44091] InferenceWorker_p0-w0: resuming experience collection +[2023-09-14 12:28:09,707][109198] Fps is (10 sec: 3686.4, 60 sec: 2711.3, 300 sec: 2711.3). Total num frames: 1052672. Throughput: 0: 493.7. Samples: 6712. Policy #0 lag: (min: 0.0, avg: 1.0, max: 3.0) +[2023-09-14 12:28:09,835][44091] Updated weights for policy 0, policy_version 258 (0.0674) +[2023-09-14 12:28:11,882][109198] Heartbeat connected on Batcher_0 +[2023-09-14 12:28:11,885][109198] Heartbeat connected on LearnerWorker_p0 +[2023-09-14 12:28:11,895][109198] Heartbeat connected on InferenceWorker_p0-w0 +[2023-09-14 12:28:11,899][109198] Heartbeat connected on RolloutWorker_w1 +[2023-09-14 12:28:11,901][109198] Heartbeat connected on RolloutWorker_w0 +[2023-09-14 12:28:11,908][109198] Heartbeat connected on RolloutWorker_w2 +[2023-09-14 12:28:11,909][109198] Heartbeat connected on RolloutWorker_w3 +[2023-09-14 12:28:11,914][109198] Heartbeat connected on RolloutWorker_w4 +[2023-09-14 12:28:11,919][109198] Heartbeat connected on RolloutWorker_w7 +[2023-09-14 12:28:11,925][109198] Heartbeat connected on RolloutWorker_w6 +[2023-09-14 12:28:11,926][109198] Heartbeat connected on RolloutWorker_w5 +[2023-09-14 12:28:12,272][44159] Large shaping reward 2.902 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 2.0), ('DAMAGECOUNT', 1.9000000000000001, 190.0), ('weapon5', 0.002)] +[2023-09-14 12:28:12,709][44091] Updated weights for policy 0, policy_version 268 (0.0014) +[2023-09-14 12:28:14,707][109198] Fps is (10 sec: 10649.8, 60 sec: 5726.7, 300 sec: 5726.7). Total num frames: 1122304. Throughput: 0: 1525.2. Samples: 28364. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:28:15,528][44091] Updated weights for policy 0, policy_version 278 (0.0014) +[2023-09-14 12:28:17,064][44158] Large shaping reward 2.602 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 1.0), ('DAMAGECOUNT', 1.6, 160.0), ('weapon5', 0.002)] +[2023-09-14 12:28:18,574][44091] Updated weights for policy 0, policy_version 288 (0.0014) +[2023-09-14 12:28:19,707][109198] Fps is (10 sec: 13926.3, 60 sec: 7464.2, 300 sec: 7464.2). Total num frames: 1191936. Throughput: 0: 1650.1. Samples: 38936. Policy #0 lag: (min: 0.0, avg: 0.9, max: 2.0) +[2023-09-14 12:28:21,259][44125] Large shaping reward 2.642 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 2.0), ('DAMAGECOUNT', 1.9100000000000001, 191.0), ('HEALTH', -0.27, -27.0), ('weapon5', 0.002)] +[2023-09-14 12:28:21,383][44091] Updated weights for policy 0, policy_version 298 (0.0013) +[2023-09-14 12:28:24,200][44091] Updated weights for policy 0, policy_version 308 (0.0013) +[2023-09-14 12:28:24,707][109198] Fps is (10 sec: 14335.9, 60 sec: 8737.3, 300 sec: 8737.3). Total num frames: 1265664. Throughput: 0: 2127.5. Samples: 60840. Policy #0 lag: (min: 0.0, avg: 1.1, max: 2.0) +[2023-09-14 12:28:27,060][44091] Updated weights for policy 0, policy_version 318 (0.0016) +[2023-09-14 12:28:29,707][109198] Fps is (10 sec: 14336.1, 60 sec: 9509.6, 300 sec: 9509.6). Total num frames: 1335296. Throughput: 0: 2431.2. Samples: 81680. Policy #0 lag: (min: 0.0, avg: 1.1, max: 3.0) +[2023-09-14 12:28:29,942][44091] Updated weights for policy 0, policy_version 328 (0.0013) +[2023-09-14 12:28:32,863][44091] Updated weights for policy 0, policy_version 338 (0.0011) +[2023-09-14 12:28:33,098][44161] Large shaping reward 2.600 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 1.0), ('DAMAGECOUNT', 1.6, 160.0)] +[2023-09-14 12:28:34,707][109198] Fps is (10 sec: 14336.1, 60 sec: 10187.9, 300 sec: 10187.9). Total num frames: 1409024. Throughput: 0: 2395.0. Samples: 92440. Policy #0 lag: (min: 0.0, avg: 1.1, max: 3.0) +[2023-09-14 12:28:35,655][44091] Updated weights for policy 0, policy_version 348 (0.0012) +[2023-09-14 12:28:38,492][44091] Updated weights for policy 0, policy_version 358 (0.0011) +[2023-09-14 12:28:39,707][109198] Fps is (10 sec: 14745.7, 60 sec: 10710.6, 300 sec: 10710.6). Total num frames: 1482752. Throughput: 0: 2621.0. Samples: 114268. Policy #0 lag: (min: 0.0, avg: 1.1, max: 3.0) +[2023-09-14 12:28:41,265][44091] Updated weights for policy 0, policy_version 368 (0.0014) +[2023-09-14 12:28:41,291][44159] DAMAGECOUNT value on done: 320.0 +[2023-09-14 12:28:41,292][44159] DAMAGECOUNT value on done: 45.0 +[2023-09-14 12:28:41,292][44159] Sum rewards: 7.206, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.041', 'weapon5': '0.060', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.270', 'WEAPON3': '0.400', 'weapon2': '0.490', 'FRAGCOUNT': '2.000', 'weapon3': '2.566', 'DAMAGECOUNT': '3.200'} +[2023-09-14 12:28:41,293][44159] Sum rewards: 2.054, reward structure: {'HEALTH': '-2.200', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.030', 'AMMO3': '0.063', 'AMMO4': '0.148', 'WEAPON5': '0.200', 'weapon2': '0.216', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.500', 'weapon4': '0.648', 'FRAGCOUNT': '1.000', 'weapon3': '2.688'} +[2023-09-14 12:28:41,427][44125] DAMAGECOUNT value on done: 30.0 +[2023-09-14 12:28:41,428][44125] DAMAGECOUNT value on done: 125.0 +[2023-09-14 12:28:41,429][44125] Sum rewards: 3.839, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.047', 'weapon5': '0.062', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.886', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.250', 'weapon3': '2.046'} +[2023-09-14 12:28:41,872][44159] DAMAGECOUNT value on done: 104.0 +[2023-09-14 12:28:41,872][44159] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:28:41,873][44159] Sum rewards: 3.513, reward structure: {'HEALTH': '-1.090', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.003', 'AMMO5': '0.005', 'AMMO4': '0.013', 'AMMO3': '0.049', 'WEAPON4': '0.100', 'weapon5': '0.176', 'WEAPON5': '0.200', 'weapon4': '0.206', 'WEAPON3': '0.400', 'weapon2': '0.696', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.040', 'weapon3': '1.716'} +[2023-09-14 12:28:41,936][44158] DAMAGECOUNT value on done: 75.0 +[2023-09-14 12:28:41,937][44158] Sum rewards: 4.013, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.036', 'AMMO3': '0.040', 'weapon5': '0.094', 'AMMO4': '0.178', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon2': '0.266', 'weapon4': '0.368', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.750', 'FRAGCOUNT': '0.999', 'weapon3': '2.474'} +[2023-09-14 12:28:41,937][44158] DAMAGECOUNT value on done: 15.0 +[2023-09-14 12:28:41,990][44125] DAMAGECOUNT value on done: 240.0 +[2023-09-14 12:28:41,990][44125] DAMAGECOUNT value on done: 125.0 +[2023-09-14 12:28:41,991][44125] Sum rewards: 4.520, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.019', 'AMMO3': '0.049', 'weapon5': '0.090', 'AMMO4': '0.095', 'WEAPON5': '0.100', 'WEAPON4': '0.300', 'WEAPON3': '0.400', 'weapon2': '0.498', 'weapon4': '0.698', 'weapon3': '1.868', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.400'} +[2023-09-14 12:28:41,991][44125] Sum rewards: 3.652, reward structure: {'HEALTH': '-2.300', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.018', 'AMMO3': '0.076', 'weapon4': '0.088', 'AMMO4': '0.090', 'WEAPON4': '0.100', 'weapon2': '0.144', 'WEAPON5': '0.200', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.250', 'FRAGCOUNT': '2.000', 'weapon3': '3.376'} +[2023-09-14 12:28:42,241][44160] DAMAGECOUNT value on done: 385.0 +[2023-09-14 12:28:42,242][44160] DAMAGECOUNT value on done: 145.0 +[2023-09-14 12:28:42,242][44160] Sum rewards: 6.017, reward structure: {'HEALTH': '-2.450', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.032', 'AMMO2': '-0.006', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'weapon5': '0.054', 'AMMO3': '0.070', 'WEAPON5': '0.300', 'weapon2': '0.572', 'WEAPON3': '0.600', 'FRAGCOUNT': '2.000', 'weapon3': '3.044', 'DAMAGECOUNT': '3.850'} +[2023-09-14 12:28:42,243][44160] Sum rewards: 0.791, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.024', 'WEAPON5': '0.100', 'AMMO3': '0.104', 'AMMO4': '0.121', 'weapon2': '0.236', 'WEAPON4': '0.300', 'weapon4': '0.684', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.450', 'weapon3': '2.066'} +[2023-09-14 12:28:42,420][44159] DAMAGECOUNT value on done: 100.0 +[2023-09-14 12:28:42,420][44159] DAMAGECOUNT value on done: 289.0 +[2023-09-14 12:28:42,421][44159] Sum rewards: 6.568, reward structure: {'HEALTH': '-1.450', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.033', 'AMMO3': '0.039', 'weapon2': '0.050', 'WEAPON5': '0.100', 'weapon5': '0.140', 'AMMO4': '0.163', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.484', 'FRAGCOUNT': '1.999', 'weapon3': '2.516', 'DAMAGECOUNT': '2.890'} +[2023-09-14 12:28:42,474][44090] DAMAGECOUNT value on done: 65.0 +[2023-09-14 12:28:42,474][44090] DAMAGECOUNT value on done: 35.0 +[2023-09-14 12:28:42,475][44090] Sum rewards: 2.669, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.013', 'AMMO3': '0.040', 'AMMO4': '0.066', 'WEAPON4': '0.100', 'weapon5': '0.100', 'weapon2': '0.106', 'weapon4': '0.154', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.350', 'WEAPON3': '0.400', 'weapon3': '3.132'} +[2023-09-14 12:28:42,515][44158] DAMAGECOUNT value on done: 55.0 +[2023-09-14 12:28:42,516][44158] DAMAGECOUNT value on done: 129.0 +[2023-09-14 12:28:42,516][44158] Sum rewards: 3.987, reward structure: {'HEALTH': '-0.550', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'weapon5': '0.056', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.114', 'WEAPON3': '0.200', 'weapon2': '0.438', 'FRAGCOUNT': '1.000', 'weapon3': '1.216', 'DAMAGECOUNT': '1.290'} +[2023-09-14 12:28:42,564][44125] DAMAGECOUNT value on done: 205.0 +[2023-09-14 12:28:42,564][44125] DAMAGECOUNT value on done: 15.0 +[2023-09-14 12:28:42,565][44125] Sum rewards: 4.651, reward structure: {'HEALTH': '-0.850', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'weapon5': '0.054', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.444', 'FRAGCOUNT': '1.000', 'weapon3': '1.500', 'DAMAGECOUNT': '2.050'} +[2023-09-14 12:28:42,627][44161] DAMAGECOUNT value on done: 146.0 +[2023-09-14 12:28:42,627][44161] DAMAGECOUNT value on done: 226.0 +[2023-09-14 12:28:42,628][44161] Sum rewards: 2.050, reward structure: {'HEALTH': '-2.100', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.023', 'AMMO3': '0.048', 'weapon5': '0.054', 'WEAPON5': '0.100', 'AMMO4': '0.116', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.542', 'weapon2': '0.574', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.460', 'weapon3': '1.630'} +[2023-09-14 12:28:42,628][44161] Sum rewards: 5.782, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO5': '0.005', 'AMMO4': '0.010', 'AMMO3': '0.042', 'weapon5': '0.120', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.702', 'FRAGCOUNT': '2.000', 'weapon3': '2.140', 'DAMAGECOUNT': '2.260'} +[2023-09-14 12:28:42,786][44160] DAMAGECOUNT value on done: 65.0 +[2023-09-14 12:28:42,786][44160] DAMAGECOUNT value on done: 110.0 +[2023-09-14 12:28:42,787][44160] Sum rewards: 3.638, reward structure: {'HEALTH': '-0.650', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.019', 'AMMO4': '0.025', 'weapon2': '0.052', 'weapon5': '0.064', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.392', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon3': '1.228'} +[2023-09-14 12:28:42,931][44159] DAMAGECOUNT value on done: 100.0 +[2023-09-14 12:28:42,931][44159] DAMAGECOUNT value on done: 8.0 +[2023-09-14 12:28:42,932][44159] Sum rewards: 4.321, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO5': '0.007', 'AMMO4': '0.010', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'weapon5': '0.144', 'WEAPON5': '0.200', 'weapon4': '0.220', 'WEAPON3': '0.400', 'weapon2': '0.682', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon3': '2.516'} +[2023-09-14 12:28:43,026][44090] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:28:43,027][44090] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:28:43,062][44158] DAMAGECOUNT value on done: 240.0 +[2023-09-14 12:28:43,063][44158] DAMAGECOUNT value on done: 105.0 +[2023-09-14 12:28:43,063][44158] Sum rewards: 4.811, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.018', 'AMMO3': '0.031', 'weapon5': '0.076', 'AMMO4': '0.092', 'weapon2': '0.120', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.300', 'weapon4': '0.556', 'FRAGCOUNT': '1.000', 'weapon3': '1.810', 'DAMAGECOUNT': '2.400'} +[2023-09-14 12:28:43,063][44158] Sum rewards: 3.391, reward structure: {'HEALTH': '-1.250', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.030', 'weapon5': '0.058', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon4': '0.282', 'WEAPON3': '0.300', 'weapon2': '0.744', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '1.874'} +[2023-09-14 12:28:43,108][44125] DAMAGECOUNT value on done: 280.0 +[2023-09-14 12:28:43,108][44125] DAMAGECOUNT value on done: 125.0 +[2023-09-14 12:28:43,109][44125] Sum rewards: 4.177, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.006', 'AMMO3': '0.059', 'WEAPON4': '0.100', 'weapon5': '0.144', 'WEAPON5': '0.200', 'weapon4': '0.392', 'weapon2': '0.492', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '2.484', 'DAMAGECOUNT': '2.800'} +[2023-09-14 12:28:43,109][44125] Sum rewards: 1.122, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.014', 'AMMO4': '0.020', 'AMMO3': '0.072', 'weapon5': '0.076', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon2': '0.332', 'weapon4': '0.362', 'WEAPON3': '0.600', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.250', 'weapon3': '2.892'} +[2023-09-14 12:28:43,173][44161] DAMAGECOUNT value on done: 20.0 +[2023-09-14 12:28:43,173][44161] DAMAGECOUNT value on done: 30.0 +[2023-09-14 12:28:43,331][44160] DAMAGECOUNT value on done: 90.0 +[2023-09-14 12:28:43,332][44160] DAMAGECOUNT value on done: 185.0 +[2023-09-14 12:28:43,332][44160] Sum rewards: 2.873, reward structure: {'HEALTH': '-1.650', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.030', 'AMMO3': '0.045', 'weapon5': '0.076', 'weapon4': '0.114', 'AMMO4': '0.148', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.420', 'DAMAGECOUNT': '0.900', 'FRAGCOUNT': '1.000', 'weapon3': '1.982'} +[2023-09-14 12:28:43,333][44160] Sum rewards: 3.811, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.010', 'AMMO3': '0.020', 'AMMO4': '0.050', 'WEAPON5': '0.100', 'weapon2': '0.118', 'weapon5': '0.178', 'WEAPON4': '0.200', 'WEAPON3': '0.200', 'weapon4': '0.860', 'FRAGCOUNT': '1.000', 'weapon3': '1.322', 'DAMAGECOUNT': '1.850'} +[2023-09-14 12:28:43,564][44090] DAMAGECOUNT value on done: 60.0 +[2023-09-14 12:28:43,564][44090] DAMAGECOUNT value on done: 95.0 +[2023-09-14 12:28:43,611][44158] DAMAGECOUNT value on done: 5.0 +[2023-09-14 12:28:43,612][44158] DAMAGECOUNT value on done: 100.0 +[2023-09-14 12:28:43,612][44158] Sum rewards: 3.625, reward structure: {'HEALTH': '-1.580', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.017', 'AMMO2': '-0.003', 'HITCOUNT': '0.000', 'AMMO5': '0.006', 'AMMO3': '0.039', 'WEAPON4': '0.100', 'weapon5': '0.120', 'WEAPON5': '0.200', 'weapon4': '0.246', 'weapon2': '0.374', 'WEAPON3': '0.400', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon3': '2.740'} +[2023-09-14 12:28:43,745][44161] DAMAGECOUNT value on done: 105.0 +[2023-09-14 12:28:43,745][44161] DAMAGECOUNT value on done: 220.0 +[2023-09-14 12:28:43,746][44161] Sum rewards: 3.053, reward structure: {'HEALTH': '-2.100', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.047', 'AMMO3': '0.073', 'weapon5': '0.110', 'WEAPON5': '0.200', 'AMMO4': '0.233', 'weapon2': '0.238', 'WEAPON4': '0.300', 'weapon4': '0.350', 'WEAPON3': '0.600', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '2.944'} +[2023-09-14 12:28:43,746][44161] Sum rewards: 4.824, reward structure: {'HEALTH': '-1.580', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.003', 'AMMO2': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.044', 'weapon5': '0.072', 'WEAPON4': '0.100', 'weapon4': '0.198', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.416', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '2.200', 'weapon3': '2.770'} +[2023-09-14 12:28:43,790][44123] DAMAGECOUNT value on done: 10.0 +[2023-09-14 12:28:43,790][44123] DAMAGECOUNT value on done: 15.0 +[2023-09-14 12:28:43,791][44123] Sum rewards: 2.451, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.023', 'AMMO3': '0.043', 'DAMAGECOUNT': '0.100', 'AMMO4': '0.114', 'weapon5': '0.116', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon2': '0.292', 'weapon4': '0.394', 'WEAPON3': '0.400', 'weapon3': '2.562'} +[2023-09-14 12:28:43,791][44123] Sum rewards: 0.413, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO3': '0.020', 'AMMO2': '0.021', 'weapon5': '0.070', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.103', 'DAMAGECOUNT': '0.150', 'WEAPON3': '0.200', 'weapon4': '0.252', 'weapon2': '0.442', 'weapon3': '0.952'} +[2023-09-14 12:28:43,921][44160] DAMAGECOUNT value on done: 125.0 +[2023-09-14 12:28:43,921][44160] DAMAGECOUNT value on done: 185.0 +[2023-09-14 12:28:43,922][44160] Sum rewards: 3.261, reward structure: {'HEALTH': '-2.050', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.011', 'AMMO4': '0.052', 'weapon4': '0.054', 'AMMO3': '0.056', 'WEAPON4': '0.100', 'weapon5': '0.128', 'WEAPON5': '0.200', 'WEAPON3': '0.500', 'weapon2': '0.748', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.850', 'weapon3': '2.606'} +[2023-09-14 12:28:43,922][44160] Sum rewards: 3.807, reward structure: {'HEALTH': '-1.850', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.028', 'weapon2': '0.032', 'weapon5': '0.034', 'AMMO3': '0.040', 'AMMO4': '0.140', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.324', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.250', 'weapon3': '3.000'} +[2023-09-14 12:28:44,099][44091] Updated weights for policy 0, policy_version 378 (0.0012) +[2023-09-14 12:28:44,103][44162] DAMAGECOUNT value on done: 65.0 +[2023-09-14 12:28:44,104][44162] DAMAGECOUNT value on done: 105.0 +[2023-09-14 12:28:44,104][44162] Sum rewards: 4.179, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.023', 'AMMO3': '0.047', 'weapon5': '0.064', 'WEAPON5': '0.100', 'AMMO4': '0.116', 'weapon2': '0.180', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.570', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '2.426'} +[2023-09-14 12:28:44,123][44090] DAMAGECOUNT value on done: 15.0 +[2023-09-14 12:28:44,123][44090] DAMAGECOUNT value on done: 90.0 +[2023-09-14 12:28:44,314][44161] DAMAGECOUNT value on done: 110.0 +[2023-09-14 12:28:44,314][44161] DAMAGECOUNT value on done: 90.0 +[2023-09-14 12:28:44,314][44161] Sum rewards: 2.797, reward structure: {'HEALTH': '-1.620', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.012', 'AMMO2': '-0.002', 'HITCOUNT': '0.000', 'AMMO5': '0.006', 'AMMO3': '0.030', 'weapon5': '0.162', 'WEAPON5': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.968', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.100', 'weapon3': '1.666'} +[2023-09-14 12:28:44,378][44123] DAMAGECOUNT value on done: 75.0 +[2023-09-14 12:28:44,379][44123] DAMAGECOUNT value on done: 142.0 +[2023-09-14 12:28:44,379][44123] Sum rewards: 1.290, reward structure: {'HEALTH': '-2.120', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.014', 'weapon5': '0.070', 'AMMO4': '0.070', 'AMMO3': '0.073', 'weapon4': '0.178', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.260', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.750', 'weapon3': '2.986'} +[2023-09-14 12:28:44,380][44123] Sum rewards: 4.469, reward structure: {'HEALTH': '-0.750', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'weapon5': '0.072', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'FRAGCOUNT': '1.000', 'weapon3': '1.172', 'weapon2': '1.202', 'DAMAGECOUNT': '1.420'} +[2023-09-14 12:28:44,681][44162] DAMAGECOUNT value on done: 111.0 +[2023-09-14 12:28:44,682][44162] DAMAGECOUNT value on done: 28.0 +[2023-09-14 12:28:44,682][44162] Sum rewards: 2.317, reward structure: {'HEALTH': '-1.360', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.006', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'weapon5': '0.124', 'WEAPON5': '0.200', 'weapon4': '0.226', 'DAMAGECOUNT': '0.280', 'WEAPON3': '0.400', 'weapon2': '0.522', 'weapon3': '2.810'} +[2023-09-14 12:28:44,707][109198] Fps is (10 sec: 14745.5, 60 sec: 11125.8, 300 sec: 11125.8). Total num frames: 1556480. Throughput: 0: 3022.8. Samples: 136028. Policy #0 lag: (min: 0.0, avg: 1.0, max: 2.0) +[2023-09-14 12:28:44,708][109198] Avg episode reward: [(0, '2.735')] +[2023-09-14 12:28:44,710][44016] Saving new best policy, reward=2.735! +[2023-09-14 12:28:45,077][44123] DAMAGECOUNT value on done: 55.0 +[2023-09-14 12:28:45,077][44123] DAMAGECOUNT value on done: 130.0 +[2023-09-14 12:28:45,078][44123] Sum rewards: -0.183, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.019', 'AMMO3': '0.038', 'AMMO4': '0.092', 'weapon5': '0.104', 'weapon2': '0.128', 'WEAPON5': '0.200', 'WEAPON3': '0.300', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.550', 'weapon4': '0.688', 'weapon3': '1.390'} +[2023-09-14 12:28:45,078][44123] Sum rewards: 4.327, reward structure: {'HEALTH': '-1.350', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.006', 'AMMO5': '0.008', 'AMMO4': '0.028', 'AMMO3': '0.044', 'WEAPON4': '0.100', 'weapon5': '0.170', 'weapon2': '0.174', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.458', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.300', 'weapon3': '2.790'} +[2023-09-14 12:28:45,200][44162] DAMAGECOUNT value on done: 100.0 +[2023-09-14 12:28:45,201][44162] Sum rewards: 4.018, reward structure: {'HEALTH': '-1.390', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.031', 'AMMO3': '0.044', 'weapon5': '0.102', 'AMMO4': '0.156', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.206', 'WEAPON3': '0.400', 'weapon4': '0.502', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon3': '2.560'} +[2023-09-14 12:28:45,200][44162] DAMAGECOUNT value on done: 39.0 +[2023-09-14 12:28:45,629][44123] DAMAGECOUNT value on done: 242.0 +[2023-09-14 12:28:45,629][44123] DAMAGECOUNT value on done: 139.0 +[2023-09-14 12:28:45,630][44123] Sum rewards: 4.529, reward structure: {'HEALTH': '-1.400', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.015', 'AMMO3': '0.041', 'weapon5': '0.050', 'AMMO4': '0.075', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.214', 'WEAPON3': '0.400', 'weapon2': '0.504', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.390', 'weapon3': '2.832'} +[2023-09-14 12:28:45,767][44162] DAMAGECOUNT value on done: 40.0 +[2023-09-14 12:28:45,767][44162] DAMAGECOUNT value on done: 76.0 +[2023-09-14 12:28:47,058][44091] Updated weights for policy 0, policy_version 388 (0.0013) +[2023-09-14 12:28:49,707][109198] Fps is (10 sec: 14336.0, 60 sec: 11387.0, 300 sec: 11387.0). Total num frames: 1626112. Throughput: 0: 3237.3. Samples: 146540. Policy #0 lag: (min: 0.0, avg: 1.2, max: 3.0) +[2023-09-14 12:28:49,708][109198] Avg episode reward: [(0, '2.739')] +[2023-09-14 12:28:49,711][44016] Saving new best policy, reward=2.739! +[2023-09-14 12:28:49,897][44091] Updated weights for policy 0, policy_version 398 (0.0011) +[2023-09-14 12:28:52,771][44091] Updated weights for policy 0, policy_version 408 (0.0013) +[2023-09-14 12:28:54,707][109198] Fps is (10 sec: 13926.5, 60 sec: 11603.7, 300 sec: 11603.7). Total num frames: 1695744. Throughput: 0: 3584.9. Samples: 168032. Policy #0 lag: (min: 0.0, avg: 0.9, max: 2.0) +[2023-09-14 12:28:54,708][109198] Avg episode reward: [(0, '2.739')] +[2023-09-14 12:28:55,526][44091] Updated weights for policy 0, policy_version 418 (0.0013) +[2023-09-14 12:28:56,364][44158] Large shaping reward 2.922 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 2.0), ('DAMAGECOUNT', 1.92, 192.0), ('weapon5', 0.002)] +[2023-09-14 12:28:58,413][44091] Updated weights for policy 0, policy_version 428 (0.0016) +[2023-09-14 12:28:59,707][109198] Fps is (10 sec: 14335.9, 60 sec: 12561.1, 300 sec: 11850.7). Total num frames: 1769472. Throughput: 0: 3584.1. Samples: 189648. Policy #0 lag: (min: 0.0, avg: 1.3, max: 3.0) +[2023-09-14 12:28:59,708][109198] Avg episode reward: [(0, '2.739')] +[2023-09-14 12:29:01,242][44091] Updated weights for policy 0, policy_version 438 (0.0012) +[2023-09-14 12:29:04,011][44091] Updated weights for policy 0, policy_version 448 (0.0013) +[2023-09-14 12:29:04,707][109198] Fps is (10 sec: 14745.6, 60 sec: 13789.9, 300 sec: 12061.7). Total num frames: 1843200. Throughput: 0: 3591.9. Samples: 200572. Policy #0 lag: (min: 0.0, avg: 1.3, max: 3.0) +[2023-09-14 12:29:04,708][109198] Avg episode reward: [(0, '2.739')] +[2023-09-14 12:29:06,835][44091] Updated weights for policy 0, policy_version 458 (0.0011) +[2023-09-14 12:29:09,707][109198] Fps is (10 sec: 14336.0, 60 sec: 14336.0, 300 sec: 12188.4). Total num frames: 1912832. Throughput: 0: 3580.0. Samples: 221940. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:29:09,708][109198] Avg episode reward: [(0, '2.739')] +[2023-09-14 12:29:09,808][44091] Updated weights for policy 0, policy_version 468 (0.0015) +[2023-09-14 12:29:12,580][44091] Updated weights for policy 0, policy_version 478 (0.0012) +[2023-09-14 12:29:14,707][109198] Fps is (10 sec: 13926.4, 60 sec: 14336.0, 300 sec: 12299.0). Total num frames: 1982464. Throughput: 0: 3598.0. Samples: 243592. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:29:14,708][109198] Avg episode reward: [(0, '2.739')] +[2023-09-14 12:29:15,489][44091] Updated weights for policy 0, policy_version 488 (0.0013) +[2023-09-14 12:29:17,982][44159] DAMAGECOUNT value on done: 666.0 +[2023-09-14 12:29:17,982][44159] DAMAGECOUNT value on done: 150.0 +[2023-09-14 12:29:17,983][44159] Sum rewards: 6.880, reward structure: {'HEALTH': '-1.920', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.005', 'AMMO4': '0.024', 'AMMO3': '0.030', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon5': '0.262', 'WEAPON3': '0.300', 'weapon2': '0.366', 'weapon4': '0.462', 'weapon3': '1.486', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.460'} +[2023-09-14 12:29:17,984][44159] Sum rewards: -1.137, reward structure: {'HEALTH': '-4.000', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO2': '0.007', 'AMMO5': '0.010', 'AMMO4': '0.036', 'AMMO3': '0.072', 'weapon4': '0.190', 'WEAPON4': '0.200', 'weapon5': '0.298', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon2': '0.680', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '2.420'} +[2023-09-14 12:29:18,496][44091] Updated weights for policy 0, policy_version 498 (0.0012) +[2023-09-14 12:29:18,573][44159] DAMAGECOUNT value on done: 140.0 +[2023-09-14 12:29:18,573][44159] Sum rewards: 3.365, reward structure: {'HEALTH': '-1.330', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.046', 'weapon5': '0.148', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.814', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.400', 'weapon3': '1.740'} +[2023-09-14 12:29:18,574][44159] DAMAGECOUNT value on done: 212.0 +[2023-09-14 12:29:18,772][44125] DAMAGECOUNT value on done: 60.0 +[2023-09-14 12:29:18,772][44125] DAMAGECOUNT value on done: 150.0 +[2023-09-14 12:29:19,150][44159] DAMAGECOUNT value on done: 180.0 +[2023-09-14 12:29:19,150][44159] DAMAGECOUNT value on done: 582.0 +[2023-09-14 12:29:19,151][44159] Sum rewards: 6.547, reward structure: {'HEALTH': '-1.600', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.050', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.290', 'weapon4': '0.330', 'weapon2': '0.372', 'WEAPON3': '0.400', 'FRAGCOUNT': '2.000', 'weapon3': '2.420', 'DAMAGECOUNT': '2.930'} +[2023-09-14 12:29:19,395][44125] DAMAGECOUNT value on done: 345.0 +[2023-09-14 12:29:19,395][44125] DAMAGECOUNT value on done: 173.0 +[2023-09-14 12:29:19,396][44125] Sum rewards: 1.991, reward structure: {'HEALTH': '-1.480', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.036', 'WEAPON4': '0.100', 'weapon4': '0.102', 'WEAPON5': '0.200', 'weapon5': '0.250', 'WEAPON3': '0.300', 'weapon2': '0.374', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '1.050'} +[2023-09-14 12:29:19,523][44160] DAMAGECOUNT value on done: 223.0 +[2023-09-14 12:29:19,523][44160] DAMAGECOUNT value on done: 495.0 +[2023-09-14 12:29:19,524][44160] Sum rewards: 3.023, reward structure: {'HEALTH': '-0.780', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.021', 'weapon5': '0.042', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.370', 'weapon3': '0.994', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100'} +[2023-09-14 12:29:19,707][109198] Fps is (10 sec: 14336.0, 60 sec: 14404.3, 300 sec: 12445.3). Total num frames: 2056192. Throughput: 0: 3599.8. Samples: 254432. Policy #0 lag: (min: 0.0, avg: 1.1, max: 2.0) +[2023-09-14 12:29:19,708][109198] Avg episode reward: [(0, '2.695')] +[2023-09-14 12:29:19,720][44159] DAMAGECOUNT value on done: 73.0 +[2023-09-14 12:29:19,720][44159] DAMAGECOUNT value on done: 250.0 +[2023-09-14 12:29:19,721][44159] Sum rewards: 0.088, reward structure: {'HEALTH': '-2.020', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.028', 'AMMO2': '-0.006', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.011', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'weapon5': '0.198', 'weapon4': '0.248', 'WEAPON5': '0.300', 'WEAPON3': '0.400', 'weapon2': '0.418', 'DAMAGECOUNT': '0.650', 'weapon3': '1.778'} +[2023-09-14 12:29:19,721][44159] Sum rewards: 4.359, reward structure: {'HEALTH': '-0.650', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'weapon2': '0.030', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.170', 'WEAPON3': '0.200', 'weapon4': '0.226', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.500', 'weapon3': '1.660'} +[2023-09-14 12:29:19,811][44161] DAMAGECOUNT value on done: 176.0 +[2023-09-14 12:29:19,812][44161] DAMAGECOUNT value on done: 429.0 +[2023-09-14 12:29:19,812][44161] Sum rewards: 1.009, reward structure: {'HEALTH': '-2.100', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.001', 'AMMO4': '0.007', 'AMMO5': '0.011', 'AMMO3': '0.069', 'weapon5': '0.152', 'DAMAGECOUNT': '0.300', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon2': '0.674', 'weapon3': '2.996'} +[2023-09-14 12:29:19,813][44161] Sum rewards: 5.271, reward structure: {'HEALTH': '-0.300', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.015', 'AMMO3': '0.020', 'weapon2': '0.072', 'AMMO4': '0.075', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.102', 'WEAPON3': '0.200', 'weapon4': '0.588', 'FRAGCOUNT': '1.000', 'weapon3': '1.266', 'DAMAGECOUNT': '2.030'} +[2023-09-14 12:29:19,942][44125] DAMAGECOUNT value on done: 400.0 +[2023-09-14 12:29:19,942][44125] DAMAGECOUNT value on done: 165.0 +[2023-09-14 12:29:19,942][44125] Sum rewards: 3.377, reward structure: {'HEALTH': '-2.150', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.003', 'AMMO5': '0.014', 'AMMO4': '0.015', 'weapon4': '0.066', 'AMMO3': '0.073', 'weapon5': '0.076', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'weapon2': '0.384', 'WEAPON3': '0.600', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.950', 'weapon3': '2.946'} +[2023-09-14 12:29:19,943][44125] Sum rewards: 3.150, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO2': '0.025', 'AMMO3': '0.043', 'weapon2': '0.068', 'AMMO4': '0.123', 'weapon5': '0.272', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'WEAPON3': '0.400', 'weapon4': '0.598', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.500', 'weapon3': '2.508'} +[2023-09-14 12:29:19,966][44158] DAMAGECOUNT value on done: 125.0 +[2023-09-14 12:29:19,966][44158] DAMAGECOUNT value on done: 67.0 +[2023-09-14 12:29:20,063][44160] DAMAGECOUNT value on done: 135.0 +[2023-09-14 12:29:20,064][44160] DAMAGECOUNT value on done: 261.0 +[2023-09-14 12:29:20,064][44160] Sum rewards: 0.497, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.019', 'weapon2': '0.050', 'AMMO3': '0.060', 'AMMO4': '0.093', 'weapon5': '0.130', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.250', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'weapon4': '0.600', 'weapon3': '2.288'} +[2023-09-14 12:29:20,065][44160] Sum rewards: 4.865, reward structure: {'HEALTH': '-1.250', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.019', 'AMMO2': '-0.004', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.240', 'weapon4': '0.286', 'weapon2': '0.296', 'WEAPON3': '0.400', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.960', 'weapon3': '2.612'} +[2023-09-14 12:29:20,299][44090] DAMAGECOUNT value on done: 110.0 +[2023-09-14 12:29:20,300][44090] DAMAGECOUNT value on done: 79.0 +[2023-09-14 12:29:20,300][44090] Sum rewards: 1.827, reward structure: {'HEALTH': '-1.080', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.049', 'AMMO2': '-0.010', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO3': '0.040', 'weapon5': '0.110', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.450', 'weapon2': '0.728', 'weapon3': '2.030'} +[2023-09-14 12:29:20,325][44161] DAMAGECOUNT value on done: 85.0 +[2023-09-14 12:29:20,325][44161] DAMAGECOUNT value on done: 200.0 +[2023-09-14 12:29:20,326][44161] Sum rewards: -0.268, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'FRAGCOUNT': '-0.002', 'HITCOUNT': '0.000', 'AMMO5': '0.017', 'AMMO2': '0.028', 'AMMO3': '0.070', 'AMMO4': '0.139', 'weapon5': '0.204', 'weapon2': '0.242', 'WEAPON4': '0.300', 'WEAPON5': '0.400', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.650', 'weapon4': '0.668', 'weapon3': '2.416'} +[2023-09-14 12:29:20,486][44125] DAMAGECOUNT value on done: 294.0 +[2023-09-14 12:29:20,486][44125] DAMAGECOUNT value on done: 260.0 +[2023-09-14 12:29:20,487][44125] Sum rewards: 4.473, reward structure: {'HEALTH': '-0.140', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'weapon2': '0.010', 'AMMO3': '0.020', 'AMMO4': '0.025', 'weapon5': '0.074', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.342', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.350', 'weapon3': '1.384'} +[2023-09-14 12:29:20,519][44158] DAMAGECOUNT value on done: 204.0 +[2023-09-14 12:29:20,520][44158] DAMAGECOUNT value on done: 229.0 +[2023-09-14 12:29:20,520][44158] Sum rewards: 4.134, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.049', 'weapon5': '0.158', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon2': '1.106', 'DAMAGECOUNT': '1.490', 'weapon3': '1.754'} +[2023-09-14 12:29:20,520][44158] Sum rewards: 2.742, reward structure: {'HEALTH': '-2.180', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.016', 'AMMO3': '0.072', 'weapon2': '0.076', 'AMMO4': '0.082', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.298', 'weapon4': '0.536', 'WEAPON3': '0.600', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon3': '2.834'} +[2023-09-14 12:29:20,607][44160] DAMAGECOUNT value on done: 245.0 +[2023-09-14 12:29:20,608][44160] DAMAGECOUNT value on done: 334.0 +[2023-09-14 12:29:20,608][44160] Sum rewards: 4.027, reward structure: {'HEALTH': '-1.800', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.006', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.350', 'WEAPON3': '0.400', 'weapon2': '0.426', 'weapon5': '0.436', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.490', 'weapon3': '2.380'} +[2023-09-14 12:29:20,608][44160] Sum rewards: 2.354, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.014', 'AMMO3': '0.058', 'AMMO4': '0.071', 'WEAPON4': '0.100', 'weapon5': '0.114', 'WEAPON5': '0.200', 'weapon4': '0.244', 'weapon2': '0.398', 'WEAPON3': '0.500', 'DAMAGECOUNT': '1.550', 'weapon3': '3.096'} +[2023-09-14 12:29:20,885][44090] DAMAGECOUNT value on done: 140.0 +[2023-09-14 12:29:20,885][44090] DAMAGECOUNT value on done: 162.0 +[2023-09-14 12:29:20,886][44090] Sum rewards: 3.251, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.024', 'AMMO3': '0.075', 'weapon2': '0.086', 'AMMO4': '0.118', 'weapon5': '0.132', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.410', 'WEAPON3': '0.600', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.400', 'weapon3': '2.998'} +[2023-09-14 12:29:20,886][44090] Sum rewards: 3.601, reward structure: {'HEALTH': '-1.650', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.009', 'AMMO3': '0.045', 'AMMO4': '0.045', 'WEAPON4': '0.100', 'weapon5': '0.106', 'weapon4': '0.196', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.898', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.620', 'weapon3': '1.626'} +[2023-09-14 12:29:20,903][44161] DAMAGECOUNT value on done: 225.0 +[2023-09-14 12:29:20,904][44161] DAMAGECOUNT value on done: 265.0 +[2023-09-14 12:29:20,904][44161] Sum rewards: 2.252, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.020', 'AMMO3': '0.046', 'weapon2': '0.046', 'AMMO4': '0.097', 'weapon5': '0.168', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'WEAPON3': '0.400', 'weapon4': '0.936', 'FRAGCOUNT': '0.998', 'DAMAGECOUNT': '1.200', 'weapon3': '1.726'} +[2023-09-14 12:29:20,905][44161] Sum rewards: 1.020, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.051', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.210', 'weapon4': '0.236', 'DAMAGECOUNT': '0.450', 'weapon2': '0.484', 'WEAPON3': '0.500', 'weapon3': '2.814'} +[2023-09-14 12:29:21,165][44158] DAMAGECOUNT value on done: 413.0 +[2023-09-14 12:29:21,166][44158] DAMAGECOUNT value on done: 427.0 +[2023-09-14 12:29:21,166][44158] Sum rewards: 1.850, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'HITCOUNT': '0.000', 'AMMO5': '0.011', 'AMMO3': '0.074', 'WEAPON4': '0.100', 'weapon5': '0.124', 'WEAPON5': '0.300', 'weapon4': '0.324', 'weapon2': '0.570', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.730', 'FRAGCOUNT': '1.999', 'weapon3': '2.030'} +[2023-09-14 12:29:21,167][44158] Sum rewards: 5.298, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.009', 'AMMO4': '0.021', 'AMMO3': '0.088', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.282', 'weapon2': '0.372', 'weapon4': '0.494', 'WEAPON3': '0.600', 'weapon3': '1.808', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '3.220'} +[2023-09-14 12:29:21,213][44123] DAMAGECOUNT value on done: 270.0 +[2023-09-14 12:29:21,213][44123] DAMAGECOUNT value on done: 53.0 +[2023-09-14 12:29:21,214][44123] Sum rewards: 4.371, reward structure: {'HEALTH': '-1.430', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.030', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon5': '0.164', 'WEAPON3': '0.300', 'weapon4': '0.310', 'weapon2': '0.380', 'FRAGCOUNT': '1.000', 'weapon3': '1.864', 'DAMAGECOUNT': '2.550'} +[2023-09-14 12:29:21,235][44160] DAMAGECOUNT value on done: 165.0 +[2023-09-14 12:29:21,236][44160] DAMAGECOUNT value on done: 210.0 +[2023-09-14 12:29:21,236][44160] Sum rewards: 2.678, reward structure: {'HEALTH': '-1.250', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.050', 'WEAPON4': '0.100', 'weapon4': '0.120', 'WEAPON5': '0.200', 'weapon5': '0.258', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.400', 'weapon2': '1.138', 'weapon3': '2.204'} +[2023-09-14 12:29:21,236][44160] Sum rewards: 1.636, reward structure: {'HEALTH': '-1.300', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.051', 'weapon5': '0.190', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.250', 'weapon4': '0.318', 'weapon2': '0.380', 'WEAPON3': '0.400', 'weapon3': '1.940'} +[2023-09-14 12:29:21,335][44091] Updated weights for policy 0, policy_version 508 (0.0014) +[2023-09-14 12:29:21,474][44161] DAMAGECOUNT value on done: 110.0 +[2023-09-14 12:29:21,474][44161] DAMAGECOUNT value on done: 170.0 +[2023-09-14 12:29:21,487][44090] DAMAGECOUNT value on done: 120.0 +[2023-09-14 12:29:21,487][44090] DAMAGECOUNT value on done: 160.0 +[2023-09-14 12:29:21,488][44090] Sum rewards: 4.139, reward structure: {'HEALTH': '-0.250', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'weapon2': '0.038', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.136', 'WEAPON3': '0.200', 'weapon4': '0.328', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.434'} +[2023-09-14 12:29:21,771][44158] DAMAGECOUNT value on done: 29.0 +[2023-09-14 12:29:21,771][44158] DAMAGECOUNT value on done: 252.0 +[2023-09-14 12:29:21,772][44158] Sum rewards: 5.748, reward structure: {'HEALTH': '-0.460', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'AMMO2': '0.023', 'weapon5': '0.070', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO4': '0.116', 'WEAPON3': '0.200', 'weapon2': '0.402', 'weapon4': '0.546', 'weapon3': '1.108', 'DAMAGECOUNT': '1.520', 'FRAGCOUNT': '2.000'} +[2023-09-14 12:29:21,775][44123] DAMAGECOUNT value on done: 380.0 +[2023-09-14 12:29:21,775][44123] DAMAGECOUNT value on done: 247.0 +[2023-09-14 12:29:21,775][44123] Sum rewards: 7.820, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'weapon2': '0.010', 'AMMO2': '0.025', 'AMMO3': '0.050', 'weapon5': '0.070', 'AMMO4': '0.125', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.318', 'WEAPON3': '0.400', 'weapon3': '2.364', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.050'} +[2023-09-14 12:29:21,776][44123] Sum rewards: 0.910, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.050', 'AMMO3': '0.096', 'WEAPON4': '0.200', 'weapon4': '0.252', 'WEAPON5': '0.300', 'weapon5': '0.310', 'weapon2': '0.372', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '2.558'} +[2023-09-14 12:29:22,126][44090] DAMAGECOUNT value on done: 70.0 +[2023-09-14 12:29:22,126][44090] DAMAGECOUNT value on done: 349.0 +[2023-09-14 12:29:22,126][44090] Sum rewards: -1.132, reward structure: {'HEALTH': '-3.020', 'DEATHCOUNT': '-3.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.014', 'AMMO5': '0.014', 'AMMO4': '0.069', 'AMMO3': '0.071', 'weapon5': '0.080', 'WEAPON4': '0.200', 'weapon4': '0.208', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.550', 'weapon2': '0.570', 'WEAPON3': '0.600', 'weapon3': '2.212'} +[2023-09-14 12:29:22,127][44090] Sum rewards: 6.179, reward structure: {'HEALTH': '-0.550', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'weapon5': '0.090', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.380', 'weapon3': '1.376', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.590'} +[2023-09-14 12:29:22,371][44123] DAMAGECOUNT value on done: 351.0 +[2023-09-14 12:29:22,372][44123] DAMAGECOUNT value on done: 330.0 +[2023-09-14 12:29:22,372][44123] Sum rewards: 6.230, reward structure: {'HEALTH': '-1.440', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.052', 'WEAPON4': '0.100', 'weapon5': '0.156', 'WEAPON5': '0.200', 'weapon4': '0.266', 'WEAPON3': '0.400', 'weapon2': '0.650', 'FRAGCOUNT': '2.000', 'weapon3': '2.038', 'DAMAGECOUNT': '2.750'} +[2023-09-14 12:29:22,510][44162] DAMAGECOUNT value on done: 136.0 +[2023-09-14 12:29:22,510][44162] DAMAGECOUNT value on done: 219.0 +[2023-09-14 12:29:22,511][44162] Sum rewards: 3.755, reward structure: {'HEALTH': '-0.710', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'weapon2': '0.048', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon5': '0.130', 'WEAPON3': '0.200', 'weapon4': '0.232', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.140', 'weapon3': '1.492'} +[2023-09-14 12:29:22,901][44123] DAMAGECOUNT value on done: 352.0 +[2023-09-14 12:29:22,901][44123] DAMAGECOUNT value on done: 209.0 +[2023-09-14 12:29:22,901][44123] Sum rewards: 2.547, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.059', 'weapon5': '0.194', 'WEAPON5': '0.200', 'WEAPON3': '0.500', 'FRAGCOUNT': '0.998', 'DAMAGECOUNT': '1.100', 'weapon2': '1.132', 'weapon3': '2.386'} +[2023-09-14 12:29:23,091][44162] DAMAGECOUNT value on done: 133.0 +[2023-09-14 12:29:23,092][44162] Sum rewards: 3.802, reward structure: {'HEALTH': '-0.050', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO3': '0.020', 'WEAPON3': '0.200', 'weapon2': '0.378', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '1.234'} +[2023-09-14 12:29:23,092][44162] DAMAGECOUNT value on done: 116.0 +[2023-09-14 12:29:23,659][44162] DAMAGECOUNT value on done: 276.0 +[2023-09-14 12:29:23,660][44162] DAMAGECOUNT value on done: 270.0 +[2023-09-14 12:29:23,660][44162] Sum rewards: 3.489, reward structure: {'HEALTH': '-1.650', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.007', 'weapon2': '0.010', 'AMMO4': '0.025', 'AMMO3': '0.033', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.220', 'WEAPON3': '0.300', 'weapon4': '0.390', 'FRAGCOUNT': '1.000', 'weapon3': '1.478', 'DAMAGECOUNT': '2.370'} +[2023-09-14 12:29:23,660][44162] Sum rewards: 1.455, reward structure: {'HEALTH': '-2.820', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.060', 'WEAPON4': '0.100', 'weapon4': '0.158', 'WEAPON5': '0.200', 'weapon5': '0.208', 'WEAPON3': '0.500', 'weapon2': '0.512', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.700', 'weapon3': '1.858'} +[2023-09-14 12:29:24,086][44091] Updated weights for policy 0, policy_version 518 (0.0012) +[2023-09-14 12:29:24,202][44162] DAMAGECOUNT value on done: 200.0 +[2023-09-14 12:29:24,203][44162] Sum rewards: 4.144, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.040', 'weapon5': '0.052', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.402', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.600', 'weapon3': '2.474'} +[2023-09-14 12:29:24,203][44162] DAMAGECOUNT value on done: 241.0 +[2023-09-14 12:29:24,707][109198] Fps is (10 sec: 14745.6, 60 sec: 14404.3, 300 sec: 12575.1). Total num frames: 2129920. Throughput: 0: 3583.9. Samples: 275544. Policy #0 lag: (min: 0.0, avg: 1.4, max: 3.0) +[2023-09-14 12:29:24,708][109198] Avg episode reward: [(0, '2.642')] +[2023-09-14 12:29:27,018][44091] Updated weights for policy 0, policy_version 528 (0.0014) +[2023-09-14 12:29:29,707][109198] Fps is (10 sec: 14336.0, 60 sec: 14404.3, 300 sec: 12647.3). Total num frames: 2199552. Throughput: 0: 3577.9. Samples: 297032. Policy #0 lag: (min: 0.0, avg: 1.1, max: 3.0) +[2023-09-14 12:29:29,708][109198] Avg episode reward: [(0, '2.642')] +[2023-09-14 12:29:29,948][44091] Updated weights for policy 0, policy_version 538 (0.0011) +[2023-09-14 12:29:33,254][44091] Updated weights for policy 0, policy_version 548 (0.0013) +[2023-09-14 12:29:34,707][109198] Fps is (10 sec: 13516.8, 60 sec: 14267.7, 300 sec: 12670.7). Total num frames: 2265088. Throughput: 0: 3556.6. Samples: 306588. Policy #0 lag: (min: 0.0, avg: 1.1, max: 2.0) +[2023-09-14 12:29:34,708][109198] Avg episode reward: [(0, '2.642')] +[2023-09-14 12:29:36,224][44091] Updated weights for policy 0, policy_version 558 (0.0013) +[2023-09-14 12:29:39,279][44091] Updated weights for policy 0, policy_version 568 (0.0013) +[2023-09-14 12:29:39,707][109198] Fps is (10 sec: 13107.2, 60 sec: 14131.2, 300 sec: 12691.7). Total num frames: 2330624. Throughput: 0: 3518.8. Samples: 326376. Policy #0 lag: (min: 0.0, avg: 1.0, max: 3.0) +[2023-09-14 12:29:39,708][109198] Avg episode reward: [(0, '2.642')] +[2023-09-14 12:29:42,194][44091] Updated weights for policy 0, policy_version 578 (0.0015) +[2023-09-14 12:29:44,707][109198] Fps is (10 sec: 13516.8, 60 sec: 14062.9, 300 sec: 12748.6). Total num frames: 2400256. Throughput: 0: 3514.9. Samples: 347820. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:29:44,708][109198] Avg episode reward: [(0, '2.642')] +[2023-09-14 12:29:45,099][44091] Updated weights for policy 0, policy_version 588 (0.0013) +[2023-09-14 12:29:47,885][44091] Updated weights for policy 0, policy_version 598 (0.0016) +[2023-09-14 12:29:49,707][109198] Fps is (10 sec: 13926.4, 60 sec: 14062.9, 300 sec: 12800.4). Total num frames: 2469888. Throughput: 0: 3512.2. Samples: 358620. Policy #0 lag: (min: 0.0, avg: 1.1, max: 2.0) +[2023-09-14 12:29:49,708][109198] Avg episode reward: [(0, '2.642')] +[2023-09-14 12:29:49,714][44016] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000603_2469888.pth... +[2023-09-14 12:29:49,777][44016] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000246_1007616.pth +[2023-09-14 12:29:51,009][44091] Updated weights for policy 0, policy_version 608 (0.0013) +[2023-09-14 12:29:53,993][44091] Updated weights for policy 0, policy_version 618 (0.0014) +[2023-09-14 12:29:54,707][109198] Fps is (10 sec: 13926.4, 60 sec: 14062.9, 300 sec: 12847.9). Total num frames: 2539520. Throughput: 0: 3476.6. Samples: 378388. Policy #0 lag: (min: 0.0, avg: 1.0, max: 2.0) +[2023-09-14 12:29:54,708][109198] Avg episode reward: [(0, '2.642')] +[2023-09-14 12:29:56,046][44159] DAMAGECOUNT value on done: 771.0 +[2023-09-14 12:29:56,046][44159] DAMAGECOUNT value on done: 284.0 +[2023-09-14 12:29:56,047][44159] Sum rewards: 3.816, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.010', 'AMMO3': '0.043', 'AMMO4': '0.050', 'weapon5': '0.054', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.280', 'WEAPON3': '0.400', 'weapon2': '0.478', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '2.344'} +[2023-09-14 12:29:56,047][44159] Sum rewards: 4.504, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.478', 'weapon2': '0.738', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.340', 'weapon3': '2.302'} +[2023-09-14 12:29:56,615][44159] DAMAGECOUNT value on done: 482.0 +[2023-09-14 12:29:56,615][44159] DAMAGECOUNT value on done: 290.0 +[2023-09-14 12:29:56,615][44159] Sum rewards: 5.953, reward structure: {'HEALTH': '-1.400', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.014', 'AMMO3': '0.042', 'weapon4': '0.050', 'AMMO4': '0.068', 'WEAPON4': '0.100', 'weapon5': '0.198', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.402', 'FRAGCOUNT': '2.000', 'weapon3': '2.172', 'DAMAGECOUNT': '2.700'} +[2023-09-14 12:29:56,616][44159] Sum rewards: 3.293, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.015', 'AMMO3': '0.050', 'WEAPON4': '0.100', 'weapon4': '0.276', 'WEAPON5': '0.300', 'weapon5': '0.312', 'WEAPON3': '0.500', 'weapon2': '0.560', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.500', 'weapon3': '2.680'} +[2023-09-14 12:29:56,916][44091] Updated weights for policy 0, policy_version 628 (0.0014) +[2023-09-14 12:29:57,069][44125] DAMAGECOUNT value on done: 165.0 +[2023-09-14 12:29:57,069][44125] DAMAGECOUNT value on done: 345.0 +[2023-09-14 12:29:57,069][44125] Sum rewards: 4.036, reward structure: {'HEALTH': '-1.550', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.012', 'AMMO3': '0.040', 'weapon5': '0.054', 'AMMO4': '0.058', 'weapon4': '0.074', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon2': '1.212', 'weapon3': '2.378'} +[2023-09-14 12:29:57,070][44125] Sum rewards: 3.002, reward structure: {'HEALTH': '-1.600', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'weapon4': '0.014', 'AMMO2': '0.015', 'AMMO3': '0.033', 'weapon5': '0.044', 'AMMO4': '0.073', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.352', 'FRAGCOUNT': '1.000', 'weapon3': '1.514', 'DAMAGECOUNT': '1.950'} +[2023-09-14 12:29:57,212][44159] DAMAGECOUNT value on done: 210.0 +[2023-09-14 12:29:57,212][44159] DAMAGECOUNT value on done: 750.0 +[2023-09-14 12:29:57,213][44159] Sum rewards: 4.421, reward structure: {'HEALTH': '-0.300', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'weapon5': '0.076', 'weapon4': '0.098', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.386', 'FRAGCOUNT': '1.000', 'weapon3': '1.058', 'DAMAGECOUNT': '1.680'} +[2023-09-14 12:29:57,732][44125] DAMAGECOUNT value on done: 516.0 +[2023-09-14 12:29:57,732][44125] Sum rewards: 4.733, reward structure: {'HEALTH': '-0.250', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.010', 'AMMO3': '0.020', 'AMMO4': '0.050', 'weapon2': '0.066', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.186', 'WEAPON3': '0.200', 'weapon4': '0.450', 'FRAGCOUNT': '1.000', 'weapon3': '1.088', 'DAMAGECOUNT': '1.710'} +[2023-09-14 12:29:57,733][44125] DAMAGECOUNT value on done: 198.0 +[2023-09-14 12:29:57,838][44159] DAMAGECOUNT value on done: 173.0 +[2023-09-14 12:29:57,838][44159] DAMAGECOUNT value on done: 360.0 +[2023-09-14 12:29:57,838][44159] Sum rewards: 1.165, reward structure: {'HEALTH': '-3.050', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.017', 'AMMO2': '0.035', 'AMMO3': '0.069', 'weapon2': '0.154', 'weapon5': '0.166', 'AMMO4': '0.175', 'weapon4': '0.292', 'WEAPON4': '0.300', 'WEAPON5': '0.400', 'WEAPON3': '0.600', 'FRAGCOUNT': '0.998', 'DAMAGECOUNT': '1.000', 'weapon3': '3.008'} +[2023-09-14 12:29:57,839][44159] Sum rewards: 3.280, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.049', 'WEAPON4': '0.100', 'weapon4': '0.118', 'weapon5': '0.176', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.454', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon3': '1.684'} +[2023-09-14 12:29:57,879][44160] DAMAGECOUNT value on done: 258.0 +[2023-09-14 12:29:57,880][44160] DAMAGECOUNT value on done: 620.0 +[2023-09-14 12:29:57,880][44160] Sum rewards: 4.373, reward structure: {'HEALTH': '-0.350', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.104', 'WEAPON3': '0.200', 'weapon5': '0.292', 'weapon2': '0.746', 'weapon3': '0.878', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.250'} +[2023-09-14 12:29:58,188][44161] DAMAGECOUNT value on done: 384.0 +[2023-09-14 12:29:58,189][44161] DAMAGECOUNT value on done: 531.0 +[2023-09-14 12:29:58,189][44161] Sum rewards: 4.795, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.008', 'AMMO3': '0.039', 'AMMO4': '0.039', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon5': '0.292', 'WEAPON3': '0.300', 'weapon4': '0.332', 'weapon2': '0.450', 'weapon3': '0.952', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.080'} +[2023-09-14 12:29:58,190][44161] Sum rewards: 2.032, reward structure: {'HEALTH': '-2.180', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.013', 'AMMO2': '0.021', 'AMMO3': '0.084', 'AMMO4': '0.105', 'weapon5': '0.188', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.316', 'weapon2': '0.364', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.020', 'weapon3': '2.000'} +[2023-09-14 12:29:58,364][44125] DAMAGECOUNT value on done: 655.0 +[2023-09-14 12:29:58,364][44125] DAMAGECOUNT value on done: 195.0 +[2023-09-14 12:29:58,365][44125] Sum rewards: 6.946, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.050', 'weapon2': '0.184', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.316', 'WEAPON3': '0.400', 'weapon4': '0.604', 'FRAGCOUNT': '1.999', 'weapon3': '2.436', 'DAMAGECOUNT': '2.550'} +[2023-09-14 12:29:58,365][44125] Sum rewards: -1.040, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO4': '0.001', 'AMMO5': '0.009', 'AMMO3': '0.050', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.300', 'weapon4': '0.308', 'weapon5': '0.392', 'weapon2': '0.456', 'WEAPON3': '0.500', 'weapon3': '2.544'} +[2023-09-14 12:29:58,515][44160] DAMAGECOUNT value on done: 341.0 +[2023-09-14 12:29:58,516][44160] Sum rewards: 3.932, reward structure: {'HEALTH': '-2.400', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.009', 'AMMO5': '0.014', 'AMMO4': '0.043', 'AMMO3': '0.058', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon5': '0.330', 'weapon4': '0.472', 'WEAPON3': '0.500', 'weapon2': '0.596', 'weapon3': '1.752', 'FRAGCOUNT': '1.998', 'DAMAGECOUNT': '2.060'} +[2023-09-14 12:29:58,515][44160] DAMAGECOUNT value on done: 401.0 +[2023-09-14 12:29:58,801][44161] DAMAGECOUNT value on done: 203.0 +[2023-09-14 12:29:58,801][44161] DAMAGECOUNT value on done: 205.0 +[2023-09-14 12:29:58,802][44161] Sum rewards: 4.321, reward structure: {'HEALTH': '-0.050', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'weapon5': '0.062', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.196', 'WEAPON3': '0.200', 'weapon2': '0.356', 'FRAGCOUNT': '1.000', 'weapon3': '1.124', 'DAMAGECOUNT': '1.180'} +[2023-09-14 12:29:58,947][44125] DAMAGECOUNT value on done: 294.0 +[2023-09-14 12:29:58,947][44125] DAMAGECOUNT value on done: 260.0 +[2023-09-14 12:29:59,105][44160] DAMAGECOUNT value on done: 500.0 +[2023-09-14 12:29:59,106][44160] Sum rewards: 3.725, reward structure: {'HEALTH': '-3.150', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'weapon2': '0.010', 'AMMO2': '0.012', 'AMMO5': '0.019', 'AMMO4': '0.061', 'AMMO3': '0.093', 'WEAPON4': '0.300', 'weapon5': '0.314', 'weapon4': '0.386', 'WEAPON5': '0.400', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.550', 'weapon3': '3.030'} +[2023-09-14 12:29:59,106][44160] DAMAGECOUNT value on done: 584.0 +[2023-09-14 12:29:59,106][44160] Sum rewards: 5.060, reward structure: {'HEALTH': '-2.350', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.013', 'AMMO2': '0.021', 'AMMO3': '0.076', 'weapon4': '0.092', 'WEAPON4': '0.100', 'AMMO4': '0.102', 'weapon5': '0.132', 'WEAPON5': '0.300', 'weapon2': '0.426', 'WEAPON3': '0.600', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.500', 'weapon3': '3.048'} +[2023-09-14 12:29:59,439][44161] DAMAGECOUNT value on done: 240.0 +[2023-09-14 12:29:59,439][44161] DAMAGECOUNT value on done: 395.0 +[2023-09-14 12:29:59,440][44161] Sum rewards: 5.128, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO4': '0.025', 'AMMO3': '0.030', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.226', 'WEAPON3': '0.300', 'weapon5': '0.586', 'weapon2': '0.968', 'DAMAGECOUNT': '1.300', 'weapon3': '1.636', 'FRAGCOUNT': '1.999'} +[2023-09-14 12:29:59,661][44160] DAMAGECOUNT value on done: 370.0 +[2023-09-14 12:29:59,661][44160] DAMAGECOUNT value on done: 295.0 +[2023-09-14 12:29:59,662][44160] Sum rewards: 3.253, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.060', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.340', 'weapon2': '0.364', 'weapon5': '0.446', 'WEAPON3': '0.500', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '2.050', 'weapon3': '2.188'} +[2023-09-14 12:29:59,662][44160] Sum rewards: 2.694, reward structure: {'HEALTH': '-2.100', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.013', 'AMMO4': '0.021', 'AMMO3': '0.053', 'weapon4': '0.088', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'weapon5': '0.464', 'WEAPON3': '0.500', 'weapon2': '0.828', 'DAMAGECOUNT': '0.850', 'FRAGCOUNT': '0.999', 'weapon3': '2.574'} +[2023-09-14 12:29:59,707][109198] Fps is (10 sec: 13516.9, 60 sec: 13926.4, 300 sec: 12858.4). Total num frames: 2605056. Throughput: 0: 3455.6. Samples: 399096. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:29:59,708][109198] Avg episode reward: [(0, '2.820')] +[2023-09-14 12:29:59,738][44158] DAMAGECOUNT value on done: 235.0 +[2023-09-14 12:29:59,738][44158] DAMAGECOUNT value on done: 172.0 +[2023-09-14 12:29:59,739][44158] Sum rewards: 3.629, reward structure: {'HEALTH': '-1.330', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.310', 'weapon4': '0.312', 'weapon2': '0.368', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon3': '2.122'} +[2023-09-14 12:29:59,739][44158] Sum rewards: 1.087, reward structure: {'HEALTH': '-2.050', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.001', 'AMMO4': '0.004', 'AMMO5': '0.009', 'weapon5': '0.040', 'AMMO3': '0.041', 'weapon4': '0.056', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.462', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '1.774'} +[2023-09-14 12:29:59,775][44016] Saving new best policy, reward=2.820! +[2023-09-14 12:29:59,918][44091] Updated weights for policy 0, policy_version 638 (0.0013) +[2023-09-14 12:29:59,986][44161] DAMAGECOUNT value on done: 264.0 +[2023-09-14 12:29:59,986][44161] DAMAGECOUNT value on done: 385.0 +[2023-09-14 12:29:59,986][44161] Sum rewards: 3.604, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.059', 'WEAPON4': '0.100', 'weapon5': '0.170', 'weapon4': '0.196', 'WEAPON5': '0.200', 'WEAPON3': '0.500', 'weapon2': '0.732', 'DAMAGECOUNT': '1.540', 'FRAGCOUNT': '2.000', 'weapon3': '2.100'} +[2023-09-14 12:29:59,987][44161] Sum rewards: 4.429, reward structure: {'HEALTH': '-2.300', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.012', 'AMMO4': '0.024', 'AMMO3': '0.057', 'weapon2': '0.132', 'weapon5': '0.256', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'WEAPON3': '0.500', 'weapon4': '0.710', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.150', 'weapon3': '2.282'} +[2023-09-14 12:30:00,208][44123] DAMAGECOUNT value on done: 375.0 +[2023-09-14 12:30:00,209][44123] DAMAGECOUNT value on done: 580.0 +[2023-09-14 12:30:00,209][44123] Sum rewards: -0.781, reward structure: {'HEALTH': '-4.350', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.015', 'AMMO4': '0.020', 'weapon5': '0.078', 'WEAPON4': '0.100', 'AMMO3': '0.139', 'weapon4': '0.256', 'WEAPON5': '0.300', 'weapon2': '0.340', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '3.266'} +[2023-09-14 12:30:00,210][44123] Sum rewards: 8.569, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.052', 'WEAPON4': '0.100', 'weapon4': '0.208', 'weapon5': '0.270', 'WEAPON5': '0.300', 'weapon2': '0.370', 'WEAPON3': '0.500', 'weapon3': '2.518', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '5.270'} +[2023-09-14 12:30:00,213][44090] DAMAGECOUNT value on done: 165.0 +[2023-09-14 12:30:00,213][44090] DAMAGECOUNT value on done: 214.0 +[2023-09-14 12:30:00,213][44090] Sum rewards: 3.295, reward structure: {'HEALTH': '-1.900', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.005', 'AMMO4': '0.024', 'weapon2': '0.028', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.550', 'weapon4': '0.582', 'weapon5': '0.740', 'FRAGCOUNT': '0.999', 'weapon3': '2.422'} +[2023-09-14 12:30:00,392][44158] DAMAGECOUNT value on done: 309.0 +[2023-09-14 12:30:00,392][44158] DAMAGECOUNT value on done: 439.0 +[2023-09-14 12:30:00,393][44158] Sum rewards: 3.258, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.044', 'AMMO3': '0.073', 'weapon5': '0.156', 'weapon2': '0.180', 'AMMO4': '0.218', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon4': '0.570', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '2.752'} +[2023-09-14 12:30:00,393][44158] Sum rewards: 5.773, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO5': '0.007', 'AMMO4': '0.012', 'AMMO3': '0.043', 'weapon4': '0.060', 'WEAPON4': '0.100', 'weapon5': '0.138', 'WEAPON5': '0.200', 'weapon2': '0.368', 'WEAPON3': '0.400', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.100', 'weapon3': '2.442'} +[2023-09-14 12:30:00,786][44123] DAMAGECOUNT value on done: 517.0 +[2023-09-14 12:30:00,787][44123] DAMAGECOUNT value on done: 279.0 +[2023-09-14 12:30:00,787][44123] Sum rewards: 4.317, reward structure: {'HEALTH': '-0.320', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon5': '0.266', 'weapon2': '0.700', 'weapon3': '0.978', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.370'} +[2023-09-14 12:30:00,820][44090] DAMAGECOUNT value on done: 182.0 +[2023-09-14 12:30:00,821][44090] DAMAGECOUNT value on done: 265.0 +[2023-09-14 12:30:00,821][44090] Sum rewards: 2.013, reward structure: {'HEALTH': '-1.500', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.009', 'AMMO4': '0.024', 'AMMO3': '0.040', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.200', 'weapon5': '0.296', 'weapon2': '0.346', 'WEAPON3': '0.400', 'weapon4': '0.424', 'weapon3': '2.370'} +[2023-09-14 12:30:00,822][44090] Sum rewards: 2.977, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.020', 'AMMO3': '0.030', 'AMMO4': '0.099', 'WEAPON5': '0.100', 'weapon5': '0.196', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.442', 'weapon4': '0.746', 'DAMAGECOUNT': '1.250', 'weapon3': '1.640'} +[2023-09-14 12:30:00,984][44158] DAMAGECOUNT value on done: 613.0 +[2023-09-14 12:30:00,985][44158] DAMAGECOUNT value on done: 613.0 +[2023-09-14 12:30:00,985][44158] Sum rewards: 4.060, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.010', 'AMMO4': '0.050', 'AMMO3': '0.076', 'WEAPON4': '0.100', 'weapon5': '0.116', 'weapon4': '0.150', 'WEAPON5': '0.200', 'WEAPON3': '0.600', 'FRAGCOUNT': '0.999', 'weapon2': '1.040', 'DAMAGECOUNT': '2.000', 'weapon3': '2.710'} +[2023-09-14 12:30:00,986][44158] Sum rewards: 4.363, reward structure: {'HEALTH': '-1.950', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.050', 'weapon2': '0.062', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.468', 'weapon4': '0.476', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.860', 'weapon3': '2.540'} +[2023-09-14 12:30:01,380][44090] DAMAGECOUNT value on done: 232.0 +[2023-09-14 12:30:01,381][44090] DAMAGECOUNT value on done: 250.0 +[2023-09-14 12:30:01,381][44090] Sum rewards: 3.600, reward structure: {'HEALTH': '-0.900', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.024', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.198', 'WEAPON3': '0.200', 'weapon2': '0.352', 'weapon5': '0.418', 'weapon3': '0.960', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.120'} +[2023-09-14 12:30:01,381][44090] Sum rewards: 1.736, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.008', 'AMMO5': '0.013', 'AMMO4': '0.037', 'AMMO3': '0.061', 'weapon4': '0.066', 'WEAPON4': '0.100', 'weapon2': '0.144', 'weapon5': '0.168', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.900', 'weapon3': '3.340'} +[2023-09-14 12:30:01,409][44123] DAMAGECOUNT value on done: 489.0 +[2023-09-14 12:30:01,409][44123] DAMAGECOUNT value on done: 481.0 +[2023-09-14 12:30:01,410][44123] Sum rewards: 2.689, reward structure: {'HEALTH': '-1.530', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO3': '0.030', 'weapon5': '0.088', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.210', 'WEAPON3': '0.300', 'weapon2': '0.354', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.380', 'weapon3': '1.684'} +[2023-09-14 12:30:01,603][44158] DAMAGECOUNT value on done: 39.0 +[2023-09-14 12:30:01,603][44158] DAMAGECOUNT value on done: 427.0 +[2023-09-14 12:30:01,604][44158] Sum rewards: 5.390, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.020', 'AMMO3': '0.040', 'weapon2': '0.090', 'AMMO4': '0.099', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon5': '0.370', 'WEAPON3': '0.400', 'weapon4': '0.854', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.750', 'weapon3': '2.460'} +[2023-09-14 12:30:01,959][44090] DAMAGECOUNT value on done: 307.0 +[2023-09-14 12:30:01,959][44090] DAMAGECOUNT value on done: 457.0 +[2023-09-14 12:30:01,960][44090] Sum rewards: 5.721, reward structure: {'HEALTH': '-1.710', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.006', 'AMMO4': '0.025', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.214', 'weapon5': '0.218', 'weapon2': '0.350', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.370', 'weapon3': '2.504'} +[2023-09-14 12:30:01,971][44123] DAMAGECOUNT value on done: 319.0 +[2023-09-14 12:30:01,971][44123] DAMAGECOUNT value on done: 497.0 +[2023-09-14 12:30:01,971][44123] Sum rewards: 2.765, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.011', 'AMMO3': '0.073', 'WEAPON4': '0.100', 'weapon4': '0.220', 'weapon5': '0.244', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon2': '0.732', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.100', 'weapon3': '2.386'} +[2023-09-14 12:30:01,972][44123] Sum rewards: 3.653, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.020', 'AMMO3': '0.037', 'WEAPON5': '0.100', 'AMMO4': '0.101', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.304', 'weapon4': '0.356', 'weapon5': '0.538', 'FRAGCOUNT': '1.000', 'weapon3': '1.244', 'DAMAGECOUNT': '1.450'} +[2023-09-14 12:30:02,470][44162] DAMAGECOUNT value on done: 171.0 +[2023-09-14 12:30:02,470][44162] DAMAGECOUNT value on done: 313.0 +[2023-09-14 12:30:02,888][44091] Updated weights for policy 0, policy_version 648 (0.0014) +[2023-09-14 12:30:03,050][44162] DAMAGECOUNT value on done: 248.0 +[2023-09-14 12:30:03,050][44162] DAMAGECOUNT value on done: 326.0 +[2023-09-14 12:30:03,050][44162] Sum rewards: 1.832, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.058', 'weapon5': '0.068', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.310', 'weapon2': '0.346', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150', 'weapon3': '2.092'} +[2023-09-14 12:30:03,051][44162] Sum rewards: 5.677, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.003', 'AMMO5': '0.008', 'AMMO4': '0.014', 'AMMO3': '0.044', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.216', 'weapon5': '0.236', 'WEAPON3': '0.400', 'weapon2': '0.554', 'weapon3': '1.952', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.100'} +[2023-09-14 12:30:03,610][44162] DAMAGECOUNT value on done: 346.0 +[2023-09-14 12:30:03,610][44162] DAMAGECOUNT value on done: 370.0 +[2023-09-14 12:30:03,611][44162] Sum rewards: 3.744, reward structure: {'HEALTH': '-1.650', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.008', 'AMMO4': '0.025', 'AMMO3': '0.043', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.372', 'WEAPON3': '0.400', 'weapon4': '0.444', 'weapon5': '0.814', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon3': '1.884'} +[2023-09-14 12:30:04,170][44162] DAMAGECOUNT value on done: 225.0 +[2023-09-14 12:30:04,170][44162] DAMAGECOUNT value on done: 341.0 +[2023-09-14 12:30:04,171][44162] Sum rewards: 1.209, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO2': '0.019', 'AMMO3': '0.068', 'AMMO4': '0.093', 'weapon2': '0.170', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.250', 'weapon4': '0.256', 'WEAPON5': '0.300', 'weapon5': '0.302', 'WEAPON3': '0.600', 'weapon3': '2.938'} +[2023-09-14 12:30:04,171][44162] Sum rewards: 4.144, reward structure: {'HEALTH': '-0.270', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.024', 'weapon2': '0.028', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.110', 'weapon6': '0.148', 'WEAPON3': '0.200', 'WEAPON6': '0.200', 'weapon4': '0.320', 'weapon3': '0.956', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000'} +[2023-09-14 12:30:04,707][109198] Fps is (10 sec: 13926.5, 60 sec: 13926.4, 300 sec: 12931.8). Total num frames: 2678784. Throughput: 0: 3452.6. Samples: 409800. Policy #0 lag: (min: 0.0, avg: 1.0, max: 3.0) +[2023-09-14 12:30:04,708][109198] Avg episode reward: [(0, '3.034')] +[2023-09-14 12:30:04,709][44016] Saving new best policy, reward=3.034! +[2023-09-14 12:30:05,657][44091] Updated weights for policy 0, policy_version 658 (0.0012) +[2023-09-14 12:30:08,496][44091] Updated weights for policy 0, policy_version 668 (0.0012) +[2023-09-14 12:30:09,707][109198] Fps is (10 sec: 14745.6, 60 sec: 13994.7, 300 sec: 12999.6). Total num frames: 2752512. Throughput: 0: 3467.0. Samples: 431560. Policy #0 lag: (min: 0.0, avg: 1.0, max: 2.0) +[2023-09-14 12:30:09,708][109198] Avg episode reward: [(0, '3.034')] +[2023-09-14 12:30:09,818][109198] Keyboard interrupt detected in the event loop EvtLoop [Runner_EvtLoop, process=main process 109198], exiting... +[2023-09-14 12:30:09,819][44016] Stopping Batcher_0... +[2023-09-14 12:30:09,819][109198] Runner profile tree view: +main_loop: 137.9013 +[2023-09-14 12:30:09,820][44016] Loop batcher_evt_loop terminating... +[2023-09-14 12:30:09,821][44016] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000672_2752512.pth... +[2023-09-14 12:30:09,820][109198] Collected {0: 2752512}, FPS: 12593.8 +[2023-09-14 12:30:09,841][44091] Weights refcount: 2 0 +[2023-09-14 12:30:09,842][44091] Stopping InferenceWorker_p0-w0... +[2023-09-14 12:30:09,843][44091] Loop inference_proc0-0_evt_loop terminating... +[2023-09-14 12:30:09,873][44016] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000248_1015808.pth +[2023-09-14 12:30:09,879][44016] Stopping LearnerWorker_p0... +[2023-09-14 12:30:09,880][44016] Loop learner_proc0_evt_loop terminating... +[2023-09-14 12:30:10,625][44159] Stopping RolloutWorker_w3... +[2023-09-14 12:30:10,626][44159] Loop rollout_proc3_evt_loop terminating... +[2023-09-14 12:30:10,626][44162] Stopping RolloutWorker_w7... +[2023-09-14 12:30:10,626][44162] Loop rollout_proc7_evt_loop terminating... +[2023-09-14 12:30:10,629][44123] Stopping RolloutWorker_w1... +[2023-09-14 12:30:10,630][44123] Loop rollout_proc1_evt_loop terminating... +[2023-09-14 12:30:10,630][44158] Stopping RolloutWorker_w5... +[2023-09-14 12:30:10,630][44161] Stopping RolloutWorker_w6... +[2023-09-14 12:30:10,630][44125] Stopping RolloutWorker_w2... +[2023-09-14 12:30:10,631][44090] Stopping RolloutWorker_w0... +[2023-09-14 12:30:10,631][44160] Stopping RolloutWorker_w4... +[2023-09-14 12:30:10,631][44161] Loop rollout_proc6_evt_loop terminating... +[2023-09-14 12:30:10,631][44090] Loop rollout_proc0_evt_loop terminating... +[2023-09-14 12:30:10,631][44125] Loop rollout_proc2_evt_loop terminating... +[2023-09-14 12:30:10,631][44158] Loop rollout_proc5_evt_loop terminating... +[2023-09-14 12:30:10,632][44160] Loop rollout_proc4_evt_loop terminating... +[2023-09-14 12:30:12,378][109198] Environment doom_basic already registered, overwriting... +[2023-09-14 12:30:12,380][109198] Environment doom_two_colors_easy already registered, overwriting... +[2023-09-14 12:30:12,382][109198] Environment doom_two_colors_hard already registered, overwriting... +[2023-09-14 12:30:12,383][109198] Environment doom_dm already registered, overwriting... +[2023-09-14 12:30:12,385][109198] Environment doom_dwango5 already registered, overwriting... +[2023-09-14 12:30:12,386][109198] Environment doom_my_way_home_flat_actions already registered, overwriting... +[2023-09-14 12:30:12,390][109198] Environment doom_defend_the_center_flat_actions already registered, overwriting... +[2023-09-14 12:30:12,392][109198] Environment doom_my_way_home already registered, overwriting... +[2023-09-14 12:30:12,393][109198] Environment doom_deadly_corridor already registered, overwriting... +[2023-09-14 12:30:12,394][109198] Environment doom_defend_the_center already registered, overwriting... +[2023-09-14 12:30:12,395][109198] Environment doom_defend_the_line already registered, overwriting... +[2023-09-14 12:30:12,396][109198] Environment doom_health_gathering already registered, overwriting... +[2023-09-14 12:30:12,397][109198] Environment doom_health_gathering_supreme already registered, overwriting... +[2023-09-14 12:30:12,397][109198] Environment doom_battle already registered, overwriting... +[2023-09-14 12:30:12,399][109198] Environment doom_battle2 already registered, overwriting... +[2023-09-14 12:30:12,399][109198] Environment doom_duel_bots already registered, overwriting... +[2023-09-14 12:30:12,400][109198] Environment doom_deathmatch_bots already registered, overwriting... +[2023-09-14 12:30:12,401][109198] Environment doom_duel already registered, overwriting... +[2023-09-14 12:30:12,402][109198] Environment doom_deathmatch_full already registered, overwriting... +[2023-09-14 12:30:12,403][109198] Environment doom_benchmark already registered, overwriting... +[2023-09-14 12:30:12,404][109198] register_encoder_factory: +[2023-09-14 12:30:12,426][109198] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json +[2023-09-14 12:30:12,430][109198] Experiment dir /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment already exists! +[2023-09-14 12:30:12,431][109198] Resuming existing experiment from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment... +[2023-09-14 12:30:12,432][109198] Weights and Biases integration disabled +[2023-09-14 12:30:12,435][109198] Environment var CUDA_VISIBLE_DEVICES is 0,1 + +[2023-09-14 12:30:14,445][109198] Starting experiment with the following configuration: +help=False +algo=APPO +env=doom_duel +experiment=default_experiment +train_dir=/home/cogstack/Documents/optuna/environments/sample_factory/train_dir +restart_behavior=resume +device=gpu +seed=None +num_policies=2 +async_rl=True +serial_mode=False +batched_sampling=False +num_batches_to_accumulate=2 +worker_num_splits=2 +policy_workers_per_policy=1 +max_policy_lag=1000 +num_workers=8 +num_envs_per_worker=4 +batch_size=1024 +num_batches_per_epoch=1 +num_epochs=1 +rollout=32 +recurrence=32 +shuffle_minibatches=False +gamma=0.99 +reward_scale=1.0 +reward_clip=1000.0 +value_bootstrap=False +normalize_returns=True +exploration_loss_coeff=0.001 +value_loss_coeff=0.5 +kl_loss_coeff=0.0 +exploration_loss=symmetric_kl +gae_lambda=0.95 +ppo_clip_ratio=0.1 +ppo_clip_value=0.2 +with_vtrace=False +vtrace_rho=1.0 +vtrace_c=1.0 +optimizer=adam +adam_eps=1e-06 +adam_beta1=0.9 +adam_beta2=0.999 +max_grad_norm=4.0 +learning_rate=0.0001 +lr_schedule=constant +lr_schedule_kl_threshold=0.008 +lr_adaptive_min=1e-06 +lr_adaptive_max=0.01 +obs_subtract_mean=0.0 +obs_scale=255.0 +normalize_input=True +normalize_input_keys=None +decorrelate_experience_max_seconds=0 +decorrelate_envs_on_one_worker=True +actor_worker_gpus=[] +set_workers_cpu_affinity=True +force_envs_single_thread=False +default_niceness=0 +log_to_file=True +experiment_summaries_interval=10 +flush_summaries_interval=30 +stats_avg=100 +summaries_use_frameskip=True +heartbeat_interval=20 +heartbeat_reporting_interval=600 +train_for_env_steps=10000000 +train_for_seconds=10000000000 +save_every_sec=120 +keep_checkpoints=2 +load_checkpoint_kind=latest +save_milestones_sec=-1 +save_best_every_sec=5 +save_best_metric=reward +save_best_after=100000 +benchmark=False +encoder_mlp_layers=[512, 512] +encoder_conv_architecture=convnet_simple +encoder_conv_mlp_layers=[512] +use_rnn=True +rnn_size=512 +rnn_type=gru +rnn_num_layers=1 +decoder_mlp_layers=[] +nonlinearity=elu +policy_initialization=orthogonal +policy_init_gain=1.0 +actor_critic_share_weights=True +adaptive_stddev=True +continuous_tanh_scale=0.0 +initial_stddev=1.0 +use_env_info_cache=False +env_gpu_actions=False +env_gpu_observations=True +env_frameskip=4 +env_framestack=1 +pixel_format=CHW +use_record_episode_statistics=False +with_wandb=False +wandb_user=None +wandb_project=sample_factory +wandb_group=None +wandb_job_type=SF +wandb_tags=[] +with_pbt=False +pbt_mix_policies_in_one_env=True +pbt_period_env_steps=5000000 +pbt_start_mutation=20000000 +pbt_replace_fraction=0.3 +pbt_mutation_rate=0.15 +pbt_replace_reward_gap=0.1 +pbt_replace_reward_gap_absolute=1e-06 +pbt_optimize_gamma=False +pbt_target_objective=true_objective +pbt_perturb_min=1.1 +pbt_perturb_max=1.5 +num_agents=-1 +num_humans=0 +num_bots=-1 +start_bot_difficulty=None +timelimit=None +res_w=128 +res_h=72 +wide_aspect_ratio=False +eval_env_frameskip=1 +fps=35 +command_line=--env=doom_dm --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=20000000 +cli_args={'env': 'doom_dm', 'num_workers': 8, 'num_envs_per_worker': 4, 'train_for_env_steps': 20000000} +git_hash=20b6d44612dad7d171f23e13b1f3b4c5e5631cf9 +git_repo_name=https://github.com/MattStammers/optuna.git +[2023-09-14 12:30:14,448][109198] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json... +[2023-09-14 12:30:14,567][109198] Rollout worker 0 uses device cpu +[2023-09-14 12:30:14,569][109198] Rollout worker 1 uses device cpu +[2023-09-14 12:30:14,571][109198] Rollout worker 2 uses device cpu +[2023-09-14 12:30:14,572][109198] Rollout worker 3 uses device cpu +[2023-09-14 12:30:14,574][109198] Rollout worker 4 uses device cpu +[2023-09-14 12:30:14,575][109198] Rollout worker 5 uses device cpu +[2023-09-14 12:30:14,576][109198] Rollout worker 6 uses device cpu +[2023-09-14 12:30:14,577][109198] Rollout worker 7 uses device cpu +[2023-09-14 12:30:14,641][109198] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:30:14,642][109198] InferenceWorker_p0-w0: min num requests: 1 +[2023-09-14 12:30:14,646][109198] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:30:14,646][109198] InferenceWorker_p1-w0: min num requests: 1 +[2023-09-14 12:30:14,677][109198] Starting all processes... +[2023-09-14 12:30:14,678][109198] Starting process learner_proc0 +[2023-09-14 12:30:16,264][109198] Starting process learner_proc1 +[2023-09-14 12:30:16,266][53511] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:30:16,266][53511] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 +[2023-09-14 12:30:16,284][53511] Num visible devices: 1 +[2023-09-14 12:30:16,305][53511] Starting seed is not provided +[2023-09-14 12:30:16,306][53511] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:30:16,306][53511] Initializing actor-critic model on device cuda:0 +[2023-09-14 12:30:16,306][53511] RunningMeanStd input shape: (23,) +[2023-09-14 12:30:16,307][53511] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:30:16,307][53511] RunningMeanStd input shape: (1,) +[2023-09-14 12:30:16,319][53511] ConvEncoder: input_channels=3 +[2023-09-14 12:30:16,449][53511] Conv encoder output size: 512 +[2023-09-14 12:30:16,450][53511] Policy head output size: 640 +[2023-09-14 12:30:16,467][53511] Created Actor Critic model with architecture: +[2023-09-14 12:30:16,468][53511] ActorCriticSharedWeights( + (obs_normalizer): ObservationNormalizer( + (running_mean_std): RunningMeanStdDictInPlace( + (running_mean_std): ModuleDict( + (measurements): RunningMeanStdInPlace() + (obs): RunningMeanStdInPlace() + ) + ) + ) + (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) + (encoder): VizdoomEncoder( + (basic_encoder): ConvEncoder( + (enc): RecursiveScriptModule( + original_name=ConvEncoderImpl + (conv_head): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Conv2d) + (1): RecursiveScriptModule(original_name=ELU) + (2): RecursiveScriptModule(original_name=Conv2d) + (3): RecursiveScriptModule(original_name=ELU) + (4): RecursiveScriptModule(original_name=Conv2d) + (5): RecursiveScriptModule(original_name=ELU) + ) + (mlp_layers): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Linear) + (1): RecursiveScriptModule(original_name=ELU) + ) + ) + ) + (measurements_head): Sequential( + (0): Linear(in_features=23, out_features=128, bias=True) + (1): ELU(alpha=1.0) + (2): Linear(in_features=128, out_features=128, bias=True) + (3): ELU(alpha=1.0) + ) + ) + (core): ModelCoreRNN( + (core): GRU(640, 512) + ) + (decoder): MlpDecoder( + (mlp): Identity() + ) + (critic_linear): Linear(in_features=512, out_features=1, bias=True) + (action_parameterization): ActionParameterizationDefault( + (distribution_linear): Linear(in_features=512, out_features=41, bias=True) + ) +) +[2023-09-14 12:30:17,346][53511] Using optimizer +[2023-09-14 12:30:17,346][53511] Loading state from checkpoint /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000672_2752512.pth... +[2023-09-14 12:30:17,379][53511] Loading model from checkpoint +[2023-09-14 12:30:17,384][53511] Loaded experiment state at self.train_step=672, self.env_steps=2752512 +[2023-09-14 12:30:17,384][53511] Initialized policy 0 weights for model version 672 +[2023-09-14 12:30:17,386][53511] LearnerWorker_p0 finished initialization! +[2023-09-14 12:30:17,386][53511] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:30:17,874][53585] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:30:17,873][109198] Starting all processes... +[2023-09-14 12:30:17,874][53585] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for learning process 1 +[2023-09-14 12:30:17,879][109198] Starting process inference_proc0-0 +[2023-09-14 12:30:17,880][109198] Starting process inference_proc1-0 +[2023-09-14 12:30:17,893][53585] Num visible devices: 1 +[2023-09-14 12:30:17,881][109198] Starting process rollout_proc0 +[2023-09-14 12:30:17,881][109198] Starting process rollout_proc1 +[2023-09-14 12:30:17,881][109198] Starting process rollout_proc2 +[2023-09-14 12:30:17,882][109198] Starting process rollout_proc3 +[2023-09-14 12:30:17,885][109198] Starting process rollout_proc4 +[2023-09-14 12:30:17,919][53585] Starting seed is not provided +[2023-09-14 12:30:17,919][53585] Using GPUs [0] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:30:17,920][53585] Initializing actor-critic model on device cuda:0 +[2023-09-14 12:30:17,920][53585] RunningMeanStd input shape: (23,) +[2023-09-14 12:30:17,920][53585] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:30:17,921][53585] RunningMeanStd input shape: (1,) +[2023-09-14 12:30:17,894][109198] Starting process rollout_proc5 +[2023-09-14 12:30:17,934][53585] ConvEncoder: input_channels=3 +[2023-09-14 12:30:17,897][109198] Starting process rollout_proc6 +[2023-09-14 12:30:17,897][109198] Starting process rollout_proc7 +[2023-09-14 12:30:18,157][53585] Conv encoder output size: 512 +[2023-09-14 12:30:18,159][53585] Policy head output size: 640 +[2023-09-14 12:30:18,189][53585] Created Actor Critic model with architecture: +[2023-09-14 12:30:18,189][53585] ActorCriticSharedWeights( + (obs_normalizer): ObservationNormalizer( + (running_mean_std): RunningMeanStdDictInPlace( + (running_mean_std): ModuleDict( + (measurements): RunningMeanStdInPlace() + (obs): RunningMeanStdInPlace() + ) + ) + ) + (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) + (encoder): VizdoomEncoder( + (basic_encoder): ConvEncoder( + (enc): RecursiveScriptModule( + original_name=ConvEncoderImpl + (conv_head): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Conv2d) + (1): RecursiveScriptModule(original_name=ELU) + (2): RecursiveScriptModule(original_name=Conv2d) + (3): RecursiveScriptModule(original_name=ELU) + (4): RecursiveScriptModule(original_name=Conv2d) + (5): RecursiveScriptModule(original_name=ELU) + ) + (mlp_layers): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Linear) + (1): RecursiveScriptModule(original_name=ELU) + ) + ) + ) + (measurements_head): Sequential( + (0): Linear(in_features=23, out_features=128, bias=True) + (1): ELU(alpha=1.0) + (2): Linear(in_features=128, out_features=128, bias=True) + (3): ELU(alpha=1.0) + ) + ) + (core): ModelCoreRNN( + (core): GRU(640, 512) + ) + (decoder): MlpDecoder( + (mlp): Identity() + ) + (critic_linear): Linear(in_features=512, out_features=1, bias=True) + (action_parameterization): ActionParameterizationDefault( + (distribution_linear): Linear(in_features=512, out_features=41, bias=True) + ) +) +[2023-09-14 12:30:19,431][53585] Using optimizer +[2023-09-14 12:30:19,432][53585] No checkpoints found +[2023-09-14 12:30:19,432][53585] Did not load from checkpoint, starting from scratch! +[2023-09-14 12:30:19,432][53585] Initialized policy 1 weights for model version 0 +[2023-09-14 12:30:19,434][53585] LearnerWorker_p1 finished initialization! +[2023-09-14 12:30:19,434][53585] Using GPUs [0] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:30:19,931][53811] Worker 6 uses CPU cores [24, 25, 26, 27] +[2023-09-14 12:30:19,972][53806] Worker 1 uses CPU cores [4, 5, 6, 7] +[2023-09-14 12:30:20,112][53808] Worker 4 uses CPU cores [16, 17, 18, 19] +[2023-09-14 12:30:20,155][53805] Worker 2 uses CPU cores [8, 9, 10, 11] +[2023-09-14 12:30:20,299][53809] Worker 5 uses CPU cores [20, 21, 22, 23] +[2023-09-14 12:30:20,319][53801] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:30:20,319][53801] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 +[2023-09-14 12:30:20,335][53810] Worker 7 uses CPU cores [28, 29, 30, 31] +[2023-09-14 12:30:20,338][53801] Num visible devices: 1 +[2023-09-14 12:30:20,351][53807] Worker 3 uses CPU cores [12, 13, 14, 15] +[2023-09-14 12:30:20,427][53802] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:30:20,427][53802] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for inference process 1 +[2023-09-14 12:30:20,442][53804] Worker 0 uses CPU cores [0, 1, 2, 3] +[2023-09-14 12:30:20,447][53802] Num visible devices: 1 +[2023-09-14 12:30:20,963][53801] RunningMeanStd input shape: (23,) +[2023-09-14 12:30:20,964][53801] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:30:20,964][53801] RunningMeanStd input shape: (1,) +[2023-09-14 12:30:20,976][53801] ConvEncoder: input_channels=3 +[2023-09-14 12:30:21,080][53801] Conv encoder output size: 512 +[2023-09-14 12:30:21,081][53801] Policy head output size: 640 +[2023-09-14 12:30:21,187][53802] RunningMeanStd input shape: (23,) +[2023-09-14 12:30:21,188][53802] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:30:21,188][53802] RunningMeanStd input shape: (1,) +[2023-09-14 12:30:21,200][53802] ConvEncoder: input_channels=3 +[2023-09-14 12:30:21,306][53802] Conv encoder output size: 512 +[2023-09-14 12:30:21,307][53802] Policy head output size: 640 +[2023-09-14 12:30:21,447][109198] Inference worker 0-0 is ready! +[2023-09-14 12:30:21,586][109198] Inference worker 1-0 is ready! +[2023-09-14 12:30:21,588][109198] All inference workers are ready! Signal rollout workers to start! +[2023-09-14 12:30:21,591][53810] Multi agent env, num agents: 2 +[2023-09-14 12:30:21,592][53805] Multi agent env, num agents: 2 +[2023-09-14 12:30:21,592][53808] Multi agent env, num agents: 2 +[2023-09-14 12:30:21,592][53806] Multi agent env, num agents: 2 +[2023-09-14 12:30:21,592][53807] Multi agent env, num agents: 2 +[2023-09-14 12:30:21,594][53811] Multi agent env, num agents: 2 +[2023-09-14 12:30:21,594][53809] Multi agent env, num agents: 2 +[2023-09-14 12:30:21,595][53804] Multi agent env, num agents: 2 +[2023-09-14 12:30:21,622][53805] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:30:21,625][53805] Multi agent env, num agents: 2 +[2023-09-14 12:30:21,626][53810] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:30:21,627][53811] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:30:21,628][53809] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:30:21,628][53804] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:30:21,629][53810] Multi agent env, num agents: 2 +[2023-09-14 12:30:21,630][53811] Multi agent env, num agents: 2 +[2023-09-14 12:30:21,631][53809] Multi agent env, num agents: 2 +[2023-09-14 12:30:21,631][53804] Multi agent env, num agents: 2 +[2023-09-14 12:30:21,639][53806] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:30:21,639][53807] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:30:21,639][53808] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:30:21,643][53806] Multi agent env, num agents: 2 +[2023-09-14 12:30:21,643][53807] Multi agent env, num agents: 2 +[2023-09-14 12:30:21,643][53808] Multi agent env, num agents: 2 +[2023-09-14 12:30:21,654][53805] Port 40500 is available +[2023-09-14 12:30:21,654][53805] Using port 40500 +[2023-09-14 12:30:21,655][53805] Initializing env for player 0, init_info: {'port': 40500}... +[2023-09-14 12:30:21,659][53810] UDP port 41000 cannot be used [Errno 98] Address already in use +[2023-09-14 12:30:21,659][53810] Port 42000 is available +[2023-09-14 12:30:21,659][53810] Using port 42000 +[2023-09-14 12:30:21,659][53811] Port 40900 is available +[2023-09-14 12:30:21,659][53811] Using port 40900 +[2023-09-14 12:30:21,660][53810] Initializing env for player 0, init_info: {'port': 42000}... +[2023-09-14 12:30:21,661][53809] Port 40800 is available +[2023-09-14 12:30:21,661][53809] Using port 40800 +[2023-09-14 12:30:21,662][53804] Port 40300 is available +[2023-09-14 12:30:21,662][53804] Using port 40300 +[2023-09-14 12:30:21,689][53807] Port 40600 is available +[2023-09-14 12:30:21,689][53808] Port 40700 is available +[2023-09-14 12:30:21,689][53806] Port 40400 is available +[2023-09-14 12:30:21,689][53807] Using port 40600 +[2023-09-14 12:30:21,689][53808] Using port 40700 +[2023-09-14 12:30:21,689][53806] Using port 40400 +[2023-09-14 12:30:21,689][53805] Using port 40500 on host... +[2023-09-14 12:30:21,690][53807] Initializing env for player 0, init_info: {'port': 40600}... +[2023-09-14 12:30:21,690][53808] Initializing env for player 0, init_info: {'port': 40700}... +[2023-09-14 12:30:21,690][53806] Initializing env for player 0, init_info: {'port': 40400}... +[2023-09-14 12:30:21,695][53810] Using port 42000 on host... +[2023-09-14 12:30:21,711][53810] Initializing env for player 1, init_info: {'port': 42000}... +[2023-09-14 12:30:21,719][53805] Initializing env for player 1, init_info: {'port': 40500}... +[2023-09-14 12:30:21,722][53808] Using port 40700 on host... +[2023-09-14 12:30:21,725][53806] Using port 40400 on host... +[2023-09-14 12:30:21,728][53807] Using port 40600 on host... +[2023-09-14 12:30:21,740][53808] Initializing env for player 1, init_info: {'port': 40700}... +[2023-09-14 12:30:21,740][53806] Initializing env for player 1, init_info: {'port': 40400}... +[2023-09-14 12:30:21,740][53807] Initializing env for player 1, init_info: {'port': 40600}... +[2023-09-14 12:30:22,436][109198] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 2752512. Throughput: 0: nan, 1: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 12:30:22,795][53805] Initialized w:2 v:0 player:1 +[2023-09-14 12:30:22,796][53805] Initialized w:2 v:0 player:0 +[2023-09-14 12:30:22,799][53805] 2 agent workers initialized for env 2! +[2023-09-14 12:30:22,803][53808] Initialized w:4 v:0 player:1 +[2023-09-14 12:30:22,804][53808] Initialized w:4 v:0 player:0 +[2023-09-14 12:30:22,805][53808] 2 agent workers initialized for env 4! +[2023-09-14 12:30:22,814][53805] Decorrelating experience for 0 frames... +[2023-09-14 12:30:22,815][53808] Decorrelating experience for 0 frames... +[2023-09-14 12:30:22,815][53805] Port 40501 is available +[2023-09-14 12:30:22,815][53805] Using port 40501 +[2023-09-14 12:30:22,815][53808] Port 40701 is available +[2023-09-14 12:30:22,816][53808] Using port 40701 +[2023-09-14 12:30:22,816][53805] Initializing env for player 0, init_info: {'port': 40501}... +[2023-09-14 12:30:22,816][53808] Initializing env for player 0, init_info: {'port': 40701}... +[2023-09-14 12:30:22,822][53811] Initializing env for player 0, init_info: {'port': 40900}... +[2023-09-14 12:30:22,844][53805] Using port 40501 on host... +[2023-09-14 12:30:22,845][53808] Using port 40701 on host... +[2023-09-14 12:30:22,851][53811] Using port 40900 on host... +[2023-09-14 12:30:22,866][53805] Initializing env for player 1, init_info: {'port': 40501}... +[2023-09-14 12:30:22,867][53808] Initializing env for player 1, init_info: {'port': 40701}... +[2023-09-14 12:30:22,871][53810] Initialized w:7 v:0 player:0 +[2023-09-14 12:30:22,872][53810] Initialized w:7 v:0 player:1 +[2023-09-14 12:30:22,873][53811] Initializing env for player 1, init_info: {'port': 40900}... +[2023-09-14 12:30:22,874][53810] 2 agent workers initialized for env 7! +[2023-09-14 12:30:22,885][53810] Decorrelating experience for 0 frames... +[2023-09-14 12:30:22,888][53810] UDP port 41001 cannot be used [Errno 98] Address already in use +[2023-09-14 12:30:22,888][53810] Port 42001 is available +[2023-09-14 12:30:22,889][53810] Using port 42001 +[2023-09-14 12:30:22,913][53807] Initialized w:3 v:0 player:0 +[2023-09-14 12:30:22,914][53807] Initialized w:3 v:0 player:1 +[2023-09-14 12:30:22,915][53807] 2 agent workers initialized for env 3! +[2023-09-14 12:30:22,925][53807] Decorrelating experience for 0 frames... +[2023-09-14 12:30:22,926][53807] Port 40601 is available +[2023-09-14 12:30:22,925][53806] Initialized w:1 v:0 player:1 +[2023-09-14 12:30:22,926][53807] Using port 40601 +[2023-09-14 12:30:22,926][53806] Initialized w:1 v:0 player:0 +[2023-09-14 12:30:22,927][53807] Initializing env for player 0, init_info: {'port': 40601}... +[2023-09-14 12:30:22,929][53806] 2 agent workers initialized for env 1! +[2023-09-14 12:30:22,941][53810] Initializing env for player 0, init_info: {'port': 42001}... +[2023-09-14 12:30:22,946][53806] Decorrelating experience for 0 frames... +[2023-09-14 12:30:22,947][53806] Port 40401 is available +[2023-09-14 12:30:22,948][53806] Using port 40401 +[2023-09-14 12:30:22,948][53806] Initializing env for player 0, init_info: {'port': 40401}... +[2023-09-14 12:30:22,971][53810] Using port 42001 on host... +[2023-09-14 12:30:22,972][53807] Using port 40601 on host... +[2023-09-14 12:30:22,978][53806] Using port 40401 on host... +[2023-09-14 12:30:22,978][53807] Initializing env for player 1, init_info: {'port': 40601}... +[2023-09-14 12:30:22,992][53810] Initializing env for player 1, init_info: {'port': 42001}... +[2023-09-14 12:30:22,999][53806] Initializing env for player 1, init_info: {'port': 40401}... +[2023-09-14 12:30:23,888][53805] Initialized w:2 v:1 player:0 +[2023-09-14 12:30:23,889][53805] Initialized w:2 v:1 player:1 +[2023-09-14 12:30:23,890][53805] 2 agent workers initialized for env 2! +[2023-09-14 12:30:23,894][53808] Initialized w:4 v:1 player:0 +[2023-09-14 12:30:23,895][53808] Initialized w:4 v:1 player:1 +[2023-09-14 12:30:23,896][53808] 2 agent workers initialized for env 4! +[2023-09-14 12:30:23,904][53808] Decorrelating experience for 32 frames... +[2023-09-14 12:30:23,905][53805] Decorrelating experience for 32 frames... +[2023-09-14 12:30:23,964][53808] Multi agent env, num agents: 2 +[2023-09-14 12:30:23,970][53805] Multi agent env, num agents: 2 +[2023-09-14 12:30:23,985][53811] Initialized w:6 v:0 player:1 +[2023-09-14 12:30:23,988][53811] Initialized w:6 v:0 player:0 +[2023-09-14 12:30:23,988][53811] 2 agent workers initialized for env 6! +[2023-09-14 12:30:23,994][53808] Multi agent env, num agents: 2 +[2023-09-14 12:30:24,000][53811] Decorrelating experience for 0 frames... +[2023-09-14 12:30:24,001][53811] Port 40901 is available +[2023-09-14 12:30:24,002][53811] Using port 40901 +[2023-09-14 12:30:24,009][53805] Multi agent env, num agents: 2 +[2023-09-14 12:30:24,022][53808] Port 40702 is available +[2023-09-14 12:30:24,023][53808] Using port 40702 +[2023-09-14 12:30:24,023][53808] Initializing env for player 0, init_info: {'port': 40702}... +[2023-09-14 12:30:24,033][53809] Initializing env for player 0, init_info: {'port': 40800}... +[2023-09-14 12:30:24,037][53805] Port 40502 is available +[2023-09-14 12:30:24,037][53805] Using port 40502 +[2023-09-14 12:30:24,041][53810] Initialized w:7 v:1 player:1 +[2023-09-14 12:30:24,041][53810] Initialized w:7 v:1 player:0 +[2023-09-14 12:30:24,043][53810] 2 agent workers initialized for env 7! +[2023-09-14 12:30:24,051][53810] Decorrelating experience for 32 frames... +[2023-09-14 12:30:24,058][53808] Using port 40702 on host... +[2023-09-14 12:30:24,072][53809] Using port 40800 on host... +[2023-09-14 12:30:24,074][53808] Initializing env for player 1, init_info: {'port': 40702}... +[2023-09-14 12:30:24,087][53809] Initializing env for player 1, init_info: {'port': 40800}... +[2023-09-14 12:30:24,113][53810] Multi agent env, num agents: 2 +[2023-09-14 12:30:24,130][53806] Initialized w:1 v:1 player:0 +[2023-09-14 12:30:24,131][53806] Initialized w:1 v:1 player:1 +[2023-09-14 12:30:24,132][53806] 2 agent workers initialized for env 1! +[2023-09-14 12:30:24,139][53807] Initialized w:3 v:1 player:1 +[2023-09-14 12:30:24,139][53807] Initialized w:3 v:1 player:0 +[2023-09-14 12:30:24,140][53807] 2 agent workers initialized for env 3! +[2023-09-14 12:30:24,142][53806] Decorrelating experience for 32 frames... +[2023-09-14 12:30:24,143][53810] Multi agent env, num agents: 2 +[2023-09-14 12:30:24,148][53807] Decorrelating experience for 32 frames... +[2023-09-14 12:30:24,154][53811] Initializing env for player 0, init_info: {'port': 40901}... +[2023-09-14 12:30:24,178][53810] UDP port 41002 cannot be used [Errno 98] Address already in use +[2023-09-14 12:30:24,178][53810] Port 42002 is available +[2023-09-14 12:30:24,178][53810] Using port 42002 +[2023-09-14 12:30:24,179][53810] Initializing env for player 0, init_info: {'port': 42002}... +[2023-09-14 12:30:24,205][53811] Initializing env for player 1, init_info: {'port': 40901}... +[2023-09-14 12:30:24,206][53811] Using port 40901 on host... +[2023-09-14 12:30:24,214][53810] Using port 42002 on host... +[2023-09-14 12:30:24,221][53806] Multi agent env, num agents: 2 +[2023-09-14 12:30:24,224][53807] Multi agent env, num agents: 2 +[2023-09-14 12:30:24,231][53810] Initializing env for player 1, init_info: {'port': 42002}... +[2023-09-14 12:30:24,264][53807] Multi agent env, num agents: 2 +[2023-09-14 12:30:24,268][53806] Multi agent env, num agents: 2 +[2023-09-14 12:30:24,313][53806] Port 40402 is available +[2023-09-14 12:30:24,314][53806] Using port 40402 +[2023-09-14 12:30:24,314][53806] Initializing env for player 0, init_info: {'port': 40402}... +[2023-09-14 12:30:24,319][53807] Port 40602 is available +[2023-09-14 12:30:24,319][53807] Using port 40602 +[2023-09-14 12:30:24,320][53807] Initializing env for player 0, init_info: {'port': 40602}... +[2023-09-14 12:30:24,358][53806] Using port 40402 on host... +[2023-09-14 12:30:24,364][53807] Using port 40602 on host... +[2023-09-14 12:30:24,366][53806] Initializing env for player 1, init_info: {'port': 40402}... +[2023-09-14 12:30:24,371][53807] Initializing env for player 1, init_info: {'port': 40602}... +[2023-09-14 12:30:25,109][53808] Initialized w:4 v:2 player:0 +[2023-09-14 12:30:25,110][53808] Initialized w:4 v:2 player:1 +[2023-09-14 12:30:25,112][53808] 2 agent workers initialized for env 4! +[2023-09-14 12:30:25,123][53808] Decorrelating experience for 64 frames... +[2023-09-14 12:30:25,249][53808] Port 40703 is available +[2023-09-14 12:30:25,249][53808] Using port 40703 +[2023-09-14 12:30:25,250][53808] Initializing env for player 0, init_info: {'port': 40703}... +[2023-09-14 12:30:25,265][53809] Initialized w:5 v:0 player:0 +[2023-09-14 12:30:25,265][53809] Initialized w:5 v:0 player:1 +[2023-09-14 12:30:25,268][53809] 2 agent workers initialized for env 5! +[2023-09-14 12:30:25,278][53808] Using port 40703 on host... +[2023-09-14 12:30:25,285][53809] Decorrelating experience for 0 frames... +[2023-09-14 12:30:25,285][53809] Port 40801 is available +[2023-09-14 12:30:25,285][53809] Using port 40801 +[2023-09-14 12:30:25,286][53809] Initializing env for player 0, init_info: {'port': 40801}... +[2023-09-14 12:30:25,297][53811] Initialized w:6 v:1 player:0 +[2023-09-14 12:30:25,298][53811] Initialized w:6 v:1 player:1 +[2023-09-14 12:30:25,300][53811] 2 agent workers initialized for env 6! +[2023-09-14 12:30:25,300][53808] Initializing env for player 1, init_info: {'port': 40703}... +[2023-09-14 12:30:25,303][53805] Initializing env for player 0, init_info: {'port': 40502}... +[2023-09-14 12:30:25,312][53811] Decorrelating experience for 32 frames... +[2023-09-14 12:30:25,316][53809] Using port 40801 on host... +[2023-09-14 12:30:25,336][53809] Initializing env for player 1, init_info: {'port': 40801}... +[2023-09-14 12:30:25,338][53805] Using port 40502 on host... +[2023-09-14 12:30:25,353][53805] Initializing env for player 1, init_info: {'port': 40502}... +[2023-09-14 12:30:25,390][53811] Multi agent env, num agents: 2 +[2023-09-14 12:30:25,404][53806] Initialized w:1 v:2 player:1 +[2023-09-14 12:30:25,405][53806] Initialized w:1 v:2 player:0 +[2023-09-14 12:30:25,406][53806] 2 agent workers initialized for env 1! +[2023-09-14 12:30:25,417][53806] Decorrelating experience for 64 frames... +[2023-09-14 12:30:25,436][53810] Initialized w:7 v:2 player:1 +[2023-09-14 12:30:25,437][53811] Multi agent env, num agents: 2 +[2023-09-14 12:30:25,437][53810] Initialized w:7 v:2 player:0 +[2023-09-14 12:30:25,438][53810] 2 agent workers initialized for env 7! +[2023-09-14 12:30:25,449][53810] Decorrelating experience for 64 frames... +[2023-09-14 12:30:25,477][53807] Initialized w:3 v:2 player:0 +[2023-09-14 12:30:25,477][53807] Initialized w:3 v:2 player:1 +[2023-09-14 12:30:25,479][53807] 2 agent workers initialized for env 3! +[2023-09-14 12:30:25,482][53811] Port 40902 is available +[2023-09-14 12:30:25,483][53811] Using port 40902 +[2023-09-14 12:30:25,483][53811] Initializing env for player 0, init_info: {'port': 40902}... +[2023-09-14 12:30:25,489][53807] Decorrelating experience for 64 frames... +[2023-09-14 12:30:25,512][53811] Using port 40902 on host... +[2023-09-14 12:30:25,534][53811] Initializing env for player 1, init_info: {'port': 40902}... +[2023-09-14 12:30:25,584][53806] Port 40403 is available +[2023-09-14 12:30:25,584][53806] Using port 40403 +[2023-09-14 12:30:25,585][53806] Initializing env for player 0, init_info: {'port': 40403}... +[2023-09-14 12:30:25,610][53810] Port 41003 is available +[2023-09-14 12:30:25,610][53810] Using port 41003 +[2023-09-14 12:30:25,611][53810] Initializing env for player 0, init_info: {'port': 41003}... +[2023-09-14 12:30:25,614][53806] Using port 40403 on host... +[2023-09-14 12:30:25,635][53806] Initializing env for player 1, init_info: {'port': 40403}... +[2023-09-14 12:30:25,648][53810] Using port 41003 on host... +[2023-09-14 12:30:25,651][53807] Port 40603 is available +[2023-09-14 12:30:25,651][53807] Using port 40603 +[2023-09-14 12:30:25,652][53807] Initializing env for player 0, init_info: {'port': 40603}... +[2023-09-14 12:30:25,662][53810] Initializing env for player 1, init_info: {'port': 41003}... +[2023-09-14 12:30:25,680][53807] Using port 40603 on host... +[2023-09-14 12:30:25,702][53807] Initializing env for player 1, init_info: {'port': 40603}... +[2023-09-14 12:30:26,449][53808] Initialized w:4 v:3 player:1 +[2023-09-14 12:30:26,450][53808] Initialized w:4 v:3 player:0 +[2023-09-14 12:30:26,452][53808] 2 agent workers initialized for env 4! +[2023-09-14 12:30:26,466][53808] Decorrelating experience for 96 frames... +[2023-09-14 12:30:26,470][53805] Initialized w:2 v:2 player:1 +[2023-09-14 12:30:26,471][53805] Initialized w:2 v:2 player:0 +[2023-09-14 12:30:26,473][53805] 2 agent workers initialized for env 2! +[2023-09-14 12:30:26,480][53805] Decorrelating experience for 64 frames... +[2023-09-14 12:30:26,518][53804] Initializing env for player 0, init_info: {'port': 40300}... +[2023-09-14 12:30:26,520][53809] Initialized w:5 v:1 player:0 +[2023-09-14 12:30:26,520][53809] Initialized w:5 v:1 player:1 +[2023-09-14 12:30:26,521][53809] 2 agent workers initialized for env 5! +[2023-09-14 12:30:26,532][53809] Decorrelating experience for 32 frames... +[2023-09-14 12:30:26,551][53804] Using port 40300 on host... +[2023-09-14 12:30:26,569][53804] Initializing env for player 1, init_info: {'port': 40300}... +[2023-09-14 12:30:26,579][53811] Initialized w:6 v:2 player:0 +[2023-09-14 12:30:26,580][53811] Initialized w:6 v:2 player:1 +[2023-09-14 12:30:26,581][53811] 2 agent workers initialized for env 6! +[2023-09-14 12:30:26,588][53811] Decorrelating experience for 64 frames... +[2023-09-14 12:30:26,614][53809] Multi agent env, num agents: 2 +[2023-09-14 12:30:26,622][53805] Port 40503 is available +[2023-09-14 12:30:26,622][53805] Using port 40503 +[2023-09-14 12:30:26,623][53805] Initializing env for player 0, init_info: {'port': 40503}... +[2023-09-14 12:30:26,643][53809] Multi agent env, num agents: 2 +[2023-09-14 12:30:26,655][53805] Using port 40503 on host... +[2023-09-14 12:30:26,673][53805] Initializing env for player 1, init_info: {'port': 40503}... +[2023-09-14 12:30:26,677][53806] Initialized w:1 v:3 player:1 +[2023-09-14 12:30:26,677][53806] Initialized w:1 v:3 player:0 +[2023-09-14 12:30:26,678][53809] Port 40802 is available +[2023-09-14 12:30:26,678][53809] Using port 40802 +[2023-09-14 12:30:26,678][53806] 2 agent workers initialized for env 1! +[2023-09-14 12:30:26,679][53809] Initializing env for player 0, init_info: {'port': 40802}... +[2023-09-14 12:30:26,690][53806] Decorrelating experience for 96 frames... +[2023-09-14 12:30:26,715][53809] Using port 40802 on host... +[2023-09-14 12:30:26,731][53809] Initializing env for player 1, init_info: {'port': 40802}... +[2023-09-14 12:30:26,739][53811] Port 40903 is available +[2023-09-14 12:30:26,739][53811] Using port 40903 +[2023-09-14 12:30:26,740][53811] Initializing env for player 0, init_info: {'port': 40903}... +[2023-09-14 12:30:26,768][53811] Using port 40903 on host... +[2023-09-14 12:30:26,790][53811] Initializing env for player 1, init_info: {'port': 40903}... +[2023-09-14 12:30:26,820][53810] Initialized w:7 v:3 player:1 +[2023-09-14 12:30:26,823][53810] Initialized w:7 v:3 player:0 +[2023-09-14 12:30:26,824][53810] 2 agent workers initialized for env 7! +[2023-09-14 12:30:26,823][53807] Initialized w:3 v:3 player:1 +[2023-09-14 12:30:26,824][53807] Initialized w:3 v:3 player:0 +[2023-09-14 12:30:26,826][53807] 2 agent workers initialized for env 3! +[2023-09-14 12:30:26,838][53807] Decorrelating experience for 96 frames... +[2023-09-14 12:30:26,840][53810] Decorrelating experience for 96 frames... +[2023-09-14 12:30:27,435][109198] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 2752512. Throughput: 0: 0.0, 1: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 12:30:27,625][53804] Initialized w:0 v:0 player:1 +[2023-09-14 12:30:27,625][53804] Initialized w:0 v:0 player:0 +[2023-09-14 12:30:27,627][53804] 2 agent workers initialized for env 0! +[2023-09-14 12:30:27,635][53804] Decorrelating experience for 0 frames... +[2023-09-14 12:30:27,635][53804] Port 40301 is available +[2023-09-14 12:30:27,636][53804] Using port 40301 +[2023-09-14 12:30:27,636][53804] Initializing env for player 0, init_info: {'port': 40301}... +[2023-09-14 12:30:27,670][53804] Using port 40301 on host... +[2023-09-14 12:30:27,686][53804] Initializing env for player 1, init_info: {'port': 40301}... +[2023-09-14 12:30:27,730][53805] Initialized w:2 v:3 player:1 +[2023-09-14 12:30:27,731][53805] Initialized w:2 v:3 player:0 +[2023-09-14 12:30:27,732][53805] 2 agent workers initialized for env 2! +[2023-09-14 12:30:27,745][53805] Decorrelating experience for 96 frames... +[2023-09-14 12:30:27,857][53811] Initialized w:6 v:3 player:0 +[2023-09-14 12:30:27,857][53811] Initialized w:6 v:3 player:1 +[2023-09-14 12:30:27,859][53811] 2 agent workers initialized for env 6! +[2023-09-14 12:30:27,860][53809] Initialized w:5 v:2 player:1 +[2023-09-14 12:30:27,860][53809] Initialized w:5 v:2 player:0 +[2023-09-14 12:30:27,862][53809] 2 agent workers initialized for env 5! +[2023-09-14 12:30:27,868][53811] Decorrelating experience for 96 frames... +[2023-09-14 12:30:27,872][53809] Decorrelating experience for 64 frames... +[2023-09-14 12:30:28,081][53809] Port 40803 is available +[2023-09-14 12:30:28,081][53809] Using port 40803 +[2023-09-14 12:30:28,081][53809] Initializing env for player 0, init_info: {'port': 40803}... +[2023-09-14 12:30:28,121][53809] Using port 40803 on host... +[2023-09-14 12:30:28,132][53809] Initializing env for player 1, init_info: {'port': 40803}... +[2023-09-14 12:30:28,780][53804] Initialized w:0 v:1 player:1 +[2023-09-14 12:30:28,780][53804] Initialized w:0 v:1 player:0 +[2023-09-14 12:30:28,782][53804] 2 agent workers initialized for env 0! +[2023-09-14 12:30:28,791][53804] Decorrelating experience for 32 frames... +[2023-09-14 12:30:28,871][53804] Multi agent env, num agents: 2 +[2023-09-14 12:30:28,916][53804] Multi agent env, num agents: 2 +[2023-09-14 12:30:28,960][53804] Port 40302 is available +[2023-09-14 12:30:28,960][53804] Using port 40302 +[2023-09-14 12:30:28,960][53804] Initializing env for player 0, init_info: {'port': 40302}... +[2023-09-14 12:30:28,995][53804] Using port 40302 on host... +[2023-09-14 12:30:29,011][53804] Initializing env for player 1, init_info: {'port': 40302}... +[2023-09-14 12:30:29,215][53809] Initialized w:5 v:3 player:0 +[2023-09-14 12:30:29,216][53809] Initialized w:5 v:3 player:1 +[2023-09-14 12:30:29,217][53809] 2 agent workers initialized for env 5! +[2023-09-14 12:30:29,233][53809] Decorrelating experience for 96 frames... +[2023-09-14 12:30:30,115][53804] Initialized w:0 v:2 player:1 +[2023-09-14 12:30:30,115][53804] Initialized w:0 v:2 player:0 +[2023-09-14 12:30:30,116][53804] 2 agent workers initialized for env 0! +[2023-09-14 12:30:30,125][53804] Decorrelating experience for 64 frames... +[2023-09-14 12:30:30,338][53804] Port 40303 is available +[2023-09-14 12:30:30,339][53804] Using port 40303 +[2023-09-14 12:30:30,339][53804] Initializing env for player 0, init_info: {'port': 40303}... +[2023-09-14 12:30:30,368][53804] Using port 40303 on host... +[2023-09-14 12:30:30,390][53804] Initializing env for player 1, init_info: {'port': 40303}... +[2023-09-14 12:30:30,484][53585] Signal inference workers to stop experience collection... +[2023-09-14 12:30:30,515][53801] InferenceWorker_p0-w0: stopping experience collection +[2023-09-14 12:30:30,517][53802] InferenceWorker_p1-w0: stopping experience collection +[2023-09-14 12:30:30,774][53511] Signal inference workers to stop experience collection... +[2023-09-14 12:30:31,424][53804] Initialized w:0 v:3 player:1 +[2023-09-14 12:30:31,424][53804] Initialized w:0 v:3 player:0 +[2023-09-14 12:30:31,425][53804] 2 agent workers initialized for env 0! +[2023-09-14 12:30:31,437][53804] Decorrelating experience for 96 frames... +[2023-09-14 12:30:32,140][53511] Signal inference workers to resume experience collection... +[2023-09-14 12:30:32,141][53801] InferenceWorker_p0-w0: resuming experience collection +[2023-09-14 12:30:32,141][53802] InferenceWorker_p1-w0: resuming experience collection +[2023-09-14 12:30:32,156][53585] Signal inference workers to resume experience collection... +[2023-09-14 12:30:32,435][109198] Fps is (10 sec: 819.2, 60 sec: 819.2, 300 sec: 819.2). Total num frames: 2760704. Throughput: 0: 288.1, 1: 271.2. Samples: 5593. Policy #0 lag: (min: 0.0, avg: 0.0, max: 0.0) +[2023-09-14 12:30:34,628][109198] Heartbeat connected on Batcher_0 +[2023-09-14 12:30:34,631][109198] Heartbeat connected on LearnerWorker_p0 +[2023-09-14 12:30:34,634][109198] Heartbeat connected on Batcher_1 +[2023-09-14 12:30:34,637][109198] Heartbeat connected on LearnerWorker_p1 +[2023-09-14 12:30:34,646][109198] Heartbeat connected on InferenceWorker_p0-w0 +[2023-09-14 12:30:34,654][109198] Heartbeat connected on InferenceWorker_p1-w0 +[2023-09-14 12:30:34,666][109198] Heartbeat connected on RolloutWorker_w1 +[2023-09-14 12:30:34,677][109198] Heartbeat connected on RolloutWorker_w0 +[2023-09-14 12:30:34,679][109198] Heartbeat connected on RolloutWorker_w5 +[2023-09-14 12:30:34,683][109198] Heartbeat connected on RolloutWorker_w3 +[2023-09-14 12:30:34,684][109198] Heartbeat connected on RolloutWorker_w2 +[2023-09-14 12:30:34,686][109198] Heartbeat connected on RolloutWorker_w7 +[2023-09-14 12:30:34,687][109198] Heartbeat connected on RolloutWorker_w4 +[2023-09-14 12:30:34,689][109198] Heartbeat connected on RolloutWorker_w6 +[2023-09-14 12:30:34,809][53807] Large shaping reward 2.602 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 1.0), ('DAMAGECOUNT', 1.6, 160.0), ('weapon5', 0.002)] +[2023-09-14 12:30:37,300][53801] Updated weights for policy 0, policy_version 682 (0.0681) +[2023-09-14 12:30:37,435][109198] Fps is (10 sec: 7782.4, 60 sec: 5188.4, 300 sec: 5188.4). Total num frames: 2830336. Throughput: 0: 623.6, 1: 559.8. Samples: 17751. Policy #0 lag: (min: 0.0, avg: 0.4, max: 3.0) +[2023-09-14 12:30:38,205][53802] Updated weights for policy 1, policy_version 10 (0.0656) +[2023-09-14 12:30:42,435][109198] Fps is (10 sec: 13516.7, 60 sec: 7168.1, 300 sec: 7168.1). Total num frames: 2895872. Throughput: 0: 750.7, 1: 653.5. Samples: 28083. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:30:42,525][53801] Updated weights for policy 0, policy_version 692 (0.0012) +[2023-09-14 12:30:44,633][53802] Updated weights for policy 1, policy_version 20 (0.0012) +[2023-09-14 12:30:47,435][109198] Fps is (10 sec: 13516.8, 60 sec: 8519.8, 300 sec: 8519.8). Total num frames: 2965504. Throughput: 0: 1051.6, 1: 899.3. Samples: 48772. Policy #0 lag: (min: 0.0, avg: 0.7, max: 3.0) +[2023-09-14 12:30:48,105][53801] Updated weights for policy 0, policy_version 702 (0.0012) +[2023-09-14 12:30:51,189][53802] Updated weights for policy 1, policy_version 30 (0.0012) +[2023-09-14 12:30:52,435][109198] Fps is (10 sec: 13926.6, 60 sec: 9420.9, 300 sec: 9420.9). Total num frames: 3035136. Throughput: 0: 1251.2, 1: 1065.3. Samples: 69497. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:30:53,578][53801] Updated weights for policy 0, policy_version 712 (0.0012) +[2023-09-14 12:30:57,435][109198] Fps is (10 sec: 13516.8, 60 sec: 9947.5, 300 sec: 9947.5). Total num frames: 3100672. Throughput: 0: 1232.5, 1: 1044.0. Samples: 79676. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:30:57,711][53802] Updated weights for policy 1, policy_version 40 (0.0012) +[2023-09-14 12:30:59,387][53801] Updated weights for policy 0, policy_version 722 (0.0014) +[2023-09-14 12:31:02,435][109198] Fps is (10 sec: 13107.2, 60 sec: 10342.5, 300 sec: 10342.5). Total num frames: 3166208. Throughput: 0: 1347.6, 1: 1141.2. Samples: 99551. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:31:03,574][53805] DAMAGECOUNT value on done: 5.0 +[2023-09-14 12:31:03,575][53805] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:31:03,854][53805] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:31:03,949][53809] Large shaping reward 2.542 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 2.0), ('DAMAGECOUNT', 1.54, 154.0), ('weapon5', 0.002)] +[2023-09-14 12:31:04,185][53805] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:31:04,185][53805] DAMAGECOUNT value on done: 40.0 +[2023-09-14 12:31:04,185][53805] Sum rewards: -1.641, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'FRAGCOUNT': '-0.002', 'AMMO5': '0.007', 'AMMO2': '0.024', 'AMMO3': '0.097', 'AMMO4': '0.120', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon5': '0.216', 'weapon3': '0.228', 'weapon4': '0.346', 'weapon2': '0.422', 'WEAPON3': '0.500'} +[2023-09-14 12:31:04,186][53805] Sum rewards: 1.004, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.005', 'AMMO4': '0.018', 'AMMO3': '0.068', 'weapon5': '0.072', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.164', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.400', 'weapon3': '0.688', 'weapon2': '0.986'} +[2023-09-14 12:31:04,510][53802] Updated weights for policy 1, policy_version 50 (0.0012) +[2023-09-14 12:31:04,785][53801] Updated weights for policy 0, policy_version 732 (0.0013) +[2023-09-14 12:31:05,511][53811] DAMAGECOUNT value on done: 168.0 +[2023-09-14 12:31:05,512][53811] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:31:05,512][53811] Sum rewards: 4.469, reward structure: {'HEALTH': '-1.220', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.039', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.254', 'weapon2': '0.346', 'weapon5': '0.354', 'WEAPON3': '0.400', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.680', 'weapon3': '2.342'} +[2023-09-14 12:31:06,043][53811] DAMAGECOUNT value on done: 109.0 +[2023-09-14 12:31:06,044][53811] DAMAGECOUNT value on done: 122.0 +[2023-09-14 12:31:06,044][53811] Sum rewards: 3.446, reward structure: {'HEALTH': '-1.600', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.014', 'weapon4': '0.020', 'AMMO3': '0.040', 'AMMO4': '0.071', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.202', 'weapon2': '0.370', 'WEAPON3': '0.400', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.090', 'weapon3': '2.532'} +[2023-09-14 12:31:07,269][53807] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:31:07,269][53807] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:31:07,435][109198] Fps is (10 sec: 13926.5, 60 sec: 10831.7, 300 sec: 10831.7). Total num frames: 3239936. Throughput: 0: 1461.1, 1: 1220.5. Samples: 120667. Policy #0 lag: (min: 0.0, avg: 0.7, max: 3.0) +[2023-09-14 12:31:07,436][109198] Avg episode reward: [(0, '2.511'), (1, '1.081')] +[2023-09-14 12:31:07,438][53585] Saving new best policy, reward=1.081! +[2023-09-14 12:31:07,477][53807] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:31:07,836][53808] DAMAGECOUNT value on done: 15.0 +[2023-09-14 12:31:07,836][53808] DAMAGECOUNT value on done: 45.0 +[2023-09-14 12:31:07,836][53808] Sum rewards: 0.317, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.043', 'AMMO3': '0.055', 'WEAPON5': '0.100', 'weapon5': '0.120', 'DAMAGECOUNT': '0.150', 'WEAPON4': '0.200', 'AMMO4': '0.216', 'weapon4': '0.252', 'WEAPON3': '0.300', 'weapon3': '0.308', 'weapon2': '0.570'} +[2023-09-14 12:31:07,852][53807] DAMAGECOUNT value on done: 86.0 +[2023-09-14 12:31:07,852][53807] DAMAGECOUNT value on done: 15.0 +[2023-09-14 12:31:08,036][53808] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:31:08,413][53807] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:31:08,414][53807] DAMAGECOUNT value on done: 118.0 +[2023-09-14 12:31:08,414][53807] Sum rewards: 4.453, reward structure: {'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.010', 'AMMO3': '0.020', 'AMMO4': '0.050', 'weapon4': '0.098', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.352', 'weapon5': '0.372', 'weapon3': '0.968', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.180'} +[2023-09-14 12:31:08,422][53808] DAMAGECOUNT value on done: 80.0 +[2023-09-14 12:31:08,422][53808] DAMAGECOUNT value on done: 16.0 +[2023-09-14 12:31:08,423][53808] Sum rewards: 1.516, reward structure: {'HEALTH': '-1.160', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.031', 'AMMO2': '-0.006', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO3': '0.030', 'WEAPON5': '0.100', 'weapon5': '0.134', 'WEAPON3': '0.300', 'weapon2': '0.446', 'DAMAGECOUNT': '0.800', 'weapon3': '1.900'} +[2023-09-14 12:31:08,596][53806] DAMAGECOUNT value on done: 115.0 +[2023-09-14 12:31:08,596][53806] DAMAGECOUNT value on done: 100.0 +[2023-09-14 12:31:08,597][53806] Sum rewards: 0.581, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'weapon5': '0.054', 'AMMO3': '0.062', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.722', 'FRAGCOUNT': '0.999', 'weapon3': '1.014', 'DAMAGECOUNT': '1.150'} +[2023-09-14 12:31:08,598][53806] Sum rewards: 3.500, reward structure: {'HEALTH': '-1.740', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.011', 'AMMO3': '0.052', 'AMMO4': '0.055', 'weapon5': '0.088', 'WEAPON4': '0.100', 'weapon4': '0.134', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.118', 'weapon3': '2.074'} +[2023-09-14 12:31:08,836][53806] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:31:08,932][53807] DAMAGECOUNT value on done: 165.0 +[2023-09-14 12:31:08,933][53807] DAMAGECOUNT value on done: 275.0 +[2023-09-14 12:31:08,933][53807] Sum rewards: 0.995, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.025', 'AMMO3': '0.092', 'WEAPON5': '0.100', 'AMMO4': '0.127', 'weapon5': '0.128', 'WEAPON4': '0.200', 'weapon4': '0.212', 'weapon2': '0.418', 'WEAPON3': '0.500', 'weapon3': '0.540', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.650'} +[2023-09-14 12:31:08,934][53807] Sum rewards: 4.119, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.035', 'AMMO3': '0.055', 'WEAPON5': '0.100', 'AMMO4': '0.174', 'WEAPON4': '0.200', 'weapon5': '0.220', 'weapon4': '0.294', 'WEAPON3': '0.300', 'weapon3': '0.386', 'weapon2': '0.602', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '2.750'} +[2023-09-14 12:31:09,027][53808] DAMAGECOUNT value on done: 210.0 +[2023-09-14 12:31:09,028][53808] DAMAGECOUNT value on done: 10.0 +[2023-09-14 12:31:09,028][53808] Sum rewards: 5.397, reward structure: {'HEALTH': '-1.980', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.049', 'weapon2': '0.086', 'weapon5': '0.180', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.632', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.100', 'weapon3': '2.476'} +[2023-09-14 12:31:09,029][53808] Sum rewards: -2.975, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'AMMO4': '-0.019', 'AMMO2': '-0.004', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'DAMAGECOUNT': '0.100', 'AMMO3': '0.107', 'WEAPON5': '0.200', 'weapon5': '0.310', 'WEAPON3': '0.600', 'weapon2': '0.766', 'weapon3': '0.958'} +[2023-09-14 12:31:09,136][53805] DAMAGECOUNT value on done: 40.0 +[2023-09-14 12:31:09,137][53805] DAMAGECOUNT value on done: 105.0 +[2023-09-14 12:31:09,137][53805] Sum rewards: 3.837, reward structure: {'HEALTH': '-1.400', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.006', 'AMMO4': '0.025', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.212', 'weapon5': '0.320', 'weapon2': '0.348', 'WEAPON3': '0.400', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '2.532'} +[2023-09-14 12:31:09,185][53806] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:31:09,185][53806] DAMAGECOUNT value on done: 120.0 +[2023-09-14 12:31:09,186][53806] Sum rewards: 4.121, reward structure: {'HEALTH': '-1.600', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'HITCOUNT': '0.000', 'AMMO5': '0.006', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.570', 'weapon2': '0.712', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.200', 'weapon3': '2.654'} +[2023-09-14 12:31:09,512][53801] Updated weights for policy 0, policy_version 742 (0.0013) +[2023-09-14 12:31:09,610][53808] DAMAGECOUNT value on done: 55.0 +[2023-09-14 12:31:09,610][53808] DAMAGECOUNT value on done: 174.0 +[2023-09-14 12:31:09,644][53811] DAMAGECOUNT value on done: 65.0 +[2023-09-14 12:31:09,644][53811] DAMAGECOUNT value on done: 206.0 +[2023-09-14 12:31:09,645][53811] Sum rewards: 5.933, reward structure: {'HEALTH': '-0.790', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'weapon5': '0.092', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.108', 'WEAPON3': '0.200', 'weapon2': '0.818', 'weapon3': '1.192', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.060'} +[2023-09-14 12:31:09,741][53806] DAMAGECOUNT value on done: 106.0 +[2023-09-14 12:31:09,741][53806] DAMAGECOUNT value on done: 25.0 +[2023-09-14 12:31:09,742][53806] Sum rewards: 3.947, reward structure: {'HEALTH': '-0.250', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'weapon5': '0.090', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.204', 'weapon2': '0.392', 'weapon3': '0.998', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.060'} +[2023-09-14 12:31:09,812][53805] DAMAGECOUNT value on done: 6.0 +[2023-09-14 12:31:09,812][53805] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:31:09,813][53805] Sum rewards: 0.637, reward structure: {'HEALTH': '-1.090', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.009', 'AMMO2': '0.025', 'AMMO3': '0.066', 'WEAPON4': '0.100', 'weapon5': '0.112', 'AMMO4': '0.123', 'WEAPON5': '0.200', 'weapon4': '0.244', 'WEAPON3': '0.400', 'weapon2': '0.520', 'weapon3': '0.930'} +[2023-09-14 12:31:09,838][53811] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:31:10,209][53811] DAMAGECOUNT value on done: 102.0 +[2023-09-14 12:31:10,209][53811] DAMAGECOUNT value on done: 75.0 +[2023-09-14 12:31:10,210][53811] Sum rewards: 2.416, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.035', 'AMMO2': '-0.007', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.030', 'weapon5': '0.044', 'WEAPON5': '0.100', 'WEAPON3': '0.300', 'weapon2': '0.550', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.020', 'weapon3': '1.410'} +[2023-09-14 12:31:10,243][53810] DAMAGECOUNT value on done: 95.0 +[2023-09-14 12:31:10,243][53810] DAMAGECOUNT value on done: 101.0 +[2023-09-14 12:31:10,244][53810] Sum rewards: 4.010, reward structure: {'HEALTH': '-0.950', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.019', 'AMMO3': '0.020', 'AMMO4': '0.096', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon5': '0.360', 'weapon2': '0.778', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.010', 'weapon3': '1.274'} +[2023-09-14 12:31:10,290][53806] DAMAGECOUNT value on done: 30.0 +[2023-09-14 12:31:10,291][53806] DAMAGECOUNT value on done: 220.0 +[2023-09-14 12:31:10,291][53806] Sum rewards: -1.689, reward structure: {'HEALTH': '-2.300', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.034', 'weapon5': '0.054', 'AMMO3': '0.075', 'WEAPON5': '0.100', 'AMMO4': '0.170', 'WEAPON4': '0.200', 'weapon4': '0.218', 'DAMAGECOUNT': '0.300', 'weapon3': '0.348', 'WEAPON3': '0.400', 'weapon2': '0.708'} +[2023-09-14 12:31:10,291][53806] Sum rewards: 5.827, reward structure: {'HEALTH': '-0.300', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'weapon4': '0.098', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon5': '0.146', 'WEAPON3': '0.200', 'weapon2': '0.696', 'FRAGCOUNT': '1.000', 'weapon3': '1.534', 'DAMAGECOUNT': '2.200'} +[2023-09-14 12:31:10,472][53810] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:31:10,832][53810] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:31:10,832][53810] DAMAGECOUNT value on done: 26.0 +[2023-09-14 12:31:10,833][53810] Sum rewards: 3.562, reward structure: {'AMMO4': '-0.012', 'AMMO2': '-0.002', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.021', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon5': '0.210', 'DAMAGECOUNT': '0.260', 'weapon2': '0.496', 'FRAGCOUNT': '1.000', 'weapon3': '1.286'} +[2023-09-14 12:31:11,023][53809] DAMAGECOUNT value on done: 248.0 +[2023-09-14 12:31:11,023][53809] DAMAGECOUNT value on done: 105.0 +[2023-09-14 12:31:11,024][53809] Sum rewards: 5.764, reward structure: {'HEALTH': '-1.290', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO4': '0.025', 'AMMO3': '0.049', 'weapon5': '0.162', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.400', 'weapon2': '0.486', 'weapon3': '1.642', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.480'} +[2023-09-14 12:31:11,024][53809] Sum rewards: 2.959, reward structure: {'HEALTH': '-2.100', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.013', 'AMMO2': '0.023', 'AMMO3': '0.056', 'AMMO4': '0.117', 'weapon2': '0.146', 'WEAPON4': '0.200', 'weapon5': '0.280', 'WEAPON5': '0.300', 'weapon4': '0.382', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '2.992'} +[2023-09-14 12:31:11,307][53809] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:31:11,402][53810] DAMAGECOUNT value on done: 75.0 +[2023-09-14 12:31:11,402][53810] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:31:11,615][53802] Updated weights for policy 1, policy_version 60 (0.0013) +[2023-09-14 12:31:11,703][53809] DAMAGECOUNT value on done: 5.0 +[2023-09-14 12:31:11,703][53809] DAMAGECOUNT value on done: 60.0 +[2023-09-14 12:31:11,703][53809] Sum rewards: -0.164, reward structure: {'HEALTH': '-1.600', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.012', 'AMMO3': '0.047', 'DAMAGECOUNT': '0.050', 'AMMO4': '0.060', 'weapon5': '0.066', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.230', 'WEAPON3': '0.300', 'weapon3': '0.730', 'weapon2': '0.738'} +[2023-09-14 12:31:12,012][53810] DAMAGECOUNT value on done: 108.0 +[2023-09-14 12:31:12,012][53810] DAMAGECOUNT value on done: 52.0 +[2023-09-14 12:31:12,013][53810] Sum rewards: 1.627, reward structure: {'HEALTH': '-1.420', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.049', 'WEAPON5': '0.100', 'weapon2': '0.364', 'WEAPON3': '0.400', 'weapon5': '0.432', 'DAMAGECOUNT': '1.080', 'weapon3': '1.650'} +[2023-09-14 12:31:12,013][53810] Sum rewards: 2.162, reward structure: {'HEALTH': '-1.830', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'weapon5': '0.302', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.520', 'weapon2': '1.072', 'weapon3': '2.482'} +[2023-09-14 12:31:12,220][53809] DAMAGECOUNT value on done: 220.0 +[2023-09-14 12:31:12,221][53809] Sum rewards: 6.824, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.016', 'AMMO2': '-0.003', 'HITCOUNT': '0.000', 'AMMO5': '0.006', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'weapon5': '0.316', 'WEAPON3': '0.400', 'weapon2': '0.954', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.200', 'weapon3': '2.728'} +[2023-09-14 12:31:12,221][53809] DAMAGECOUNT value on done: 50.0 +[2023-09-14 12:31:12,319][53804] DAMAGECOUNT value on done: 60.0 +[2023-09-14 12:31:12,319][53804] DAMAGECOUNT value on done: 60.0 +[2023-09-14 12:31:12,435][109198] Fps is (10 sec: 14336.0, 60 sec: 11141.2, 300 sec: 11141.2). Total num frames: 3309568. Throughput: 0: 1601.9, 1: 1310.7. Samples: 131067. Policy #0 lag: (min: 0.0, avg: 0.9, max: 2.0) +[2023-09-14 12:31:12,436][109198] Avg episode reward: [(0, '3.080'), (1, '0.861')] +[2023-09-14 12:31:12,439][53511] Saving new best policy, reward=3.080! +[2023-09-14 12:31:12,577][53804] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:31:12,789][53809] DAMAGECOUNT value on done: 15.0 +[2023-09-14 12:31:12,790][53809] DAMAGECOUNT value on done: 15.0 +[2023-09-14 12:31:12,907][53804] DAMAGECOUNT value on done: 105.0 +[2023-09-14 12:31:12,907][53804] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:31:12,908][53804] Sum rewards: -1.107, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.005', 'AMMO2': '0.007', 'AMMO4': '0.033', 'weapon5': '0.046', 'weapon4': '0.046', 'AMMO3': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.600', 'weapon2': '0.670', 'weapon3': '1.188'} +[2023-09-14 12:31:12,908][53804] Sum rewards: 4.845, reward structure: {'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON5': '0.100', 'weapon6': '0.148', 'WEAPON3': '0.200', 'WEAPON6': '0.200', 'weapon5': '0.350', 'weapon2': '0.374', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '1.230'} +[2023-09-14 12:31:13,506][53804] DAMAGECOUNT value on done: 161.0 +[2023-09-14 12:31:13,507][53804] DAMAGECOUNT value on done: 242.0 +[2023-09-14 12:31:13,507][53804] Sum rewards: 1.690, reward structure: {'HEALTH': '-2.400', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.007', 'AMMO5': '0.010', 'weapon5': '0.010', 'AMMO4': '0.034', 'AMMO3': '0.071', 'AMMO6': '0.100', 'AMMO7': '0.100', 'weapon6': '0.158', 'WEAPON5': '0.200', 'WEAPON6': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.202', 'weapon2': '0.350', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.338', 'DAMAGECOUNT': '1.610'} +[2023-09-14 12:31:13,508][53804] Sum rewards: 4.043, reward structure: {'HEALTH': '-2.450', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.006', 'AMMO2': '0.006', 'AMMO4': '0.031', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.284', 'weapon4': '0.306', 'WEAPON3': '0.400', 'weapon2': '0.778', 'weapon3': '1.922', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.420'} +[2023-09-14 12:31:13,827][53801] Updated weights for policy 0, policy_version 752 (0.0013) +[2023-09-14 12:31:14,084][53804] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:31:14,084][53804] DAMAGECOUNT value on done: 374.0 +[2023-09-14 12:31:14,085][53804] Sum rewards: 7.696, reward structure: {'HEALTH': '-0.730', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.010', 'AMMO3': '0.020', 'weapon2': '0.034', 'AMMO4': '0.049', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon6': '0.148', 'weapon5': '0.160', 'WEAPON3': '0.200', 'WEAPON6': '0.200', 'weapon4': '0.434', 'weapon3': '1.028', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '3.740'} +[2023-09-14 12:31:17,435][109198] Fps is (10 sec: 14745.7, 60 sec: 11543.3, 300 sec: 11543.3). Total num frames: 3387392. Throughput: 0: 1852.8, 1: 1417.7. Samples: 152765. Policy #0 lag: (min: 0.0, avg: 0.9, max: 2.0) +[2023-09-14 12:31:17,436][109198] Avg episode reward: [(0, '3.204'), (1, '0.761')] +[2023-09-14 12:31:17,438][53511] Saving new best policy, reward=3.204! +[2023-09-14 12:31:18,299][53801] Updated weights for policy 0, policy_version 762 (0.0013) +[2023-09-14 12:31:20,255][53802] Updated weights for policy 1, policy_version 70 (0.0013) +[2023-09-14 12:31:22,435][109198] Fps is (10 sec: 13926.3, 60 sec: 11605.4, 300 sec: 11605.4). Total num frames: 3448832. Throughput: 0: 1997.2, 1: 1439.8. Samples: 172419. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:31:22,436][109198] Avg episode reward: [(0, '3.204'), (1, '0.761')] +[2023-09-14 12:31:23,081][53801] Updated weights for policy 0, policy_version 772 (0.0013) +[2023-09-14 12:31:27,435][109198] Fps is (10 sec: 12287.9, 60 sec: 12629.3, 300 sec: 11657.9). Total num frames: 3510272. Throughput: 0: 2011.2, 1: 1406.6. Samples: 181885. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:31:27,437][109198] Avg episode reward: [(0, '3.204'), (1, '0.761')] +[2023-09-14 12:31:28,082][53801] Updated weights for policy 0, policy_version 782 (0.0015) +[2023-09-14 12:31:29,771][53802] Updated weights for policy 1, policy_version 80 (0.0013) +[2023-09-14 12:31:32,435][109198] Fps is (10 sec: 13107.2, 60 sec: 13653.3, 300 sec: 11819.9). Total num frames: 3579904. Throughput: 0: 2042.9, 1: 1344.3. Samples: 201196. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:31:32,436][109198] Avg episode reward: [(0, '3.204'), (1, '0.761')] +[2023-09-14 12:31:32,716][53801] Updated weights for policy 0, policy_version 792 (0.0013) +[2023-09-14 12:31:32,801][53804] Large shaping reward 2.540 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 2.0), ('DAMAGECOUNT', 1.54, 154.0)] +[2023-09-14 12:31:37,181][53801] Updated weights for policy 0, policy_version 802 (0.0012) +[2023-09-14 12:31:37,435][109198] Fps is (10 sec: 13926.4, 60 sec: 13653.3, 300 sec: 11960.4). Total num frames: 3649536. Throughput: 0: 2099.1, 1: 1295.0. Samples: 222232. Policy #0 lag: (min: 0.0, avg: 0.7, max: 3.0) +[2023-09-14 12:31:37,436][109198] Avg episode reward: [(0, '3.204'), (1, '0.761')] +[2023-09-14 12:31:38,334][53802] Updated weights for policy 1, policy_version 90 (0.0012) +[2023-09-14 12:31:41,931][53801] Updated weights for policy 0, policy_version 812 (0.0014) +[2023-09-14 12:31:42,075][53811] DAMAGECOUNT value on done: 193.0 +[2023-09-14 12:31:42,075][53811] DAMAGECOUNT value on done: 233.0 +[2023-09-14 12:31:42,076][53811] Sum rewards: 6.301, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.009', 'AMMO4': '0.024', 'AMMO3': '0.040', 'weapon2': '0.072', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon5': '0.214', 'WEAPON3': '0.400', 'weapon4': '0.512', 'FRAGCOUNT': '1.999', 'weapon3': '2.296', 'DAMAGECOUNT': '2.330'} +[2023-09-14 12:31:42,435][109198] Fps is (10 sec: 13516.7, 60 sec: 13653.3, 300 sec: 12032.0). Total num frames: 3715072. Throughput: 0: 2120.1, 1: 1265.5. Samples: 232031. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:31:42,437][109198] Avg episode reward: [(0, '3.201'), (1, '0.761')] +[2023-09-14 12:31:42,686][53811] DAMAGECOUNT value on done: 272.0 +[2023-09-14 12:31:42,687][53811] Sum rewards: 4.893, reward structure: {'HEALTH': '-0.180', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'weapon5': '0.082', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.722', 'FRAGCOUNT': '1.000', 'weapon3': '1.446', 'DAMAGECOUNT': '1.500'} +[2023-09-14 12:31:42,687][53811] DAMAGECOUNT value on done: 123.0 +[2023-09-14 12:31:42,941][53805] DAMAGECOUNT value on done: 48.0 +[2023-09-14 12:31:42,942][53805] DAMAGECOUNT value on done: 25.0 +[2023-09-14 12:31:42,942][53805] Sum rewards: 0.533, reward structure: {'HEALTH': '-1.180', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.031', 'AMMO2': '-0.006', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.048', 'weapon5': '0.198', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.200', 'WEAPON3': '0.300', 'weapon3': '0.832', 'weapon2': '0.964'} +[2023-09-14 12:31:43,676][53805] DAMAGECOUNT value on done: 185.0 +[2023-09-14 12:31:43,677][53805] Sum rewards: 4.454, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.007', 'AMMO4': '0.025', 'AMMO3': '0.046', 'weapon5': '0.172', 'WEAPON5': '0.200', 'weapon2': '0.360', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.850', 'weapon3': '2.388'} +[2023-09-14 12:31:43,677][53805] DAMAGECOUNT value on done: 140.0 +[2023-09-14 12:31:47,435][109198] Fps is (10 sec: 11878.3, 60 sec: 13380.3, 300 sec: 11950.7). Total num frames: 3768320. Throughput: 0: 2141.2, 1: 1206.5. Samples: 250199. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:31:47,437][109198] Avg episode reward: [(0, '3.221'), (1, '0.705')] +[2023-09-14 12:31:47,438][53511] Saving new best policy, reward=3.221! +[2023-09-14 12:31:47,480][53807] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:31:47,480][53807] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:31:47,598][53801] Updated weights for policy 0, policy_version 822 (0.0016) +[2023-09-14 12:31:48,063][53802] Updated weights for policy 1, policy_version 100 (0.0014) +[2023-09-14 12:31:48,164][53808] DAMAGECOUNT value on done: 105.0 +[2023-09-14 12:31:48,164][53808] DAMAGECOUNT value on done: 91.0 +[2023-09-14 12:31:48,164][53808] Sum rewards: 3.165, reward structure: {'HEALTH': '-0.460', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'weapon5': '0.046', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.354', 'DAMAGECOUNT': '0.900', 'FRAGCOUNT': '1.000', 'weapon3': '1.032'} +[2023-09-14 12:31:48,165][53808] Sum rewards: 0.479, reward structure: {'HEALTH': '-2.400', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.057', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.298', 'weapon2': '0.368', 'DAMAGECOUNT': '0.460', 'weapon5': '0.488', 'WEAPON3': '0.500', 'weapon3': '2.402'} +[2023-09-14 12:31:48,217][53807] DAMAGECOUNT value on done: 301.0 +[2023-09-14 12:31:48,217][53807] DAMAGECOUNT value on done: 93.0 +[2023-09-14 12:31:48,218][53807] Sum rewards: 6.126, reward structure: {'HEALTH': '-1.330', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.042', 'weapon2': '0.060', 'WEAPON4': '0.100', 'weapon4': '0.196', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.996', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.150', 'weapon3': '2.304'} +[2023-09-14 12:31:48,218][53807] Sum rewards: 0.332, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.013', 'AMMO3': '0.032', 'weapon5': '0.044', 'AMMO4': '0.064', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.240', 'WEAPON3': '0.300', 'weapon2': '0.356', 'DAMAGECOUNT': '0.780', 'FRAGCOUNT': '1.000', 'weapon3': '1.300'} +[2023-09-14 12:31:48,468][53806] DAMAGECOUNT value on done: 146.0 +[2023-09-14 12:31:48,469][53806] Sum rewards: 0.877, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.006', 'AMMO2': '0.011', 'AMMO4': '0.055', 'AMMO3': '0.076', 'WEAPON4': '0.100', 'weapon4': '0.102', 'WEAPON5': '0.200', 'weapon2': '0.348', 'DAMAGECOUNT': '0.460', 'weapon5': '0.476', 'WEAPON3': '0.600', 'weapon3': '2.444'} +[2023-09-14 12:31:48,469][53806] DAMAGECOUNT value on done: 310.0 +[2023-09-14 12:31:48,469][53806] Sum rewards: 4.317, reward structure: {'HEALTH': '-0.460', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'weapon5': '0.046', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.354', 'weapon3': '0.904', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.950'} +[2023-09-14 12:31:48,657][53807] DAMAGECOUNT value on done: 15.0 +[2023-09-14 12:31:48,659][53807] Sum rewards: 0.510, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'AMMO4': '-0.023', 'AMMO2': '-0.004', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'weapon5': '0.028', 'AMMO3': '0.041', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.150', 'WEAPON3': '0.300', 'weapon2': '0.756', 'weapon3': '1.158'} +[2023-09-14 12:31:48,660][53807] DAMAGECOUNT value on done: 118.0 +[2023-09-14 12:31:49,017][53808] DAMAGECOUNT value on done: 177.0 +[2023-09-14 12:31:49,017][53808] DAMAGECOUNT value on done: 220.0 +[2023-09-14 12:31:49,018][53808] Sum rewards: 3.708, reward structure: {'HEALTH': '-1.430', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.007', 'AMMO4': '0.025', 'AMMO3': '0.050', 'weapon5': '0.092', 'WEAPON4': '0.100', 'weapon4': '0.110', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.698', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.610', 'weapon3': '1.840'} +[2023-09-14 12:31:49,018][53808] Sum rewards: 2.649, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.043', 'AMMO3': '0.053', 'WEAPON5': '0.100', 'weapon5': '0.124', 'weapon4': '0.186', 'WEAPON4': '0.200', 'AMMO4': '0.215', 'WEAPON3': '0.300', 'weapon3': '0.476', 'weapon2': '0.548', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.400'} +[2023-09-14 12:31:49,282][53806] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:31:49,282][53806] DAMAGECOUNT value on done: 120.0 +[2023-09-14 12:31:49,366][53807] DAMAGECOUNT value on done: 415.0 +[2023-09-14 12:31:49,366][53807] DAMAGECOUNT value on done: 407.0 +[2023-09-14 12:31:49,367][53807] Sum rewards: 3.119, reward structure: {'HEALTH': '-1.550', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.007', 'AMMO4': '0.025', 'AMMO3': '0.055', 'weapon5': '0.156', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon2': '1.116', 'DAMAGECOUNT': '1.320', 'weapon3': '1.384'} +[2023-09-14 12:31:49,699][53808] DAMAGECOUNT value on done: 49.0 +[2023-09-14 12:31:49,699][53808] DAMAGECOUNT value on done: 210.0 +[2023-09-14 12:31:49,877][53805] DAMAGECOUNT value on done: 173.0 +[2023-09-14 12:31:49,878][53805] DAMAGECOUNT value on done: 175.0 +[2023-09-14 12:31:49,879][53805] Sum rewards: -1.822, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'AMMO4': '-0.019', 'AMMO2': '-0.004', 'FRAGCOUNT': '-0.002', 'HITCOUNT': '0.000', 'AMMO5': '0.011', 'AMMO3': '0.105', 'weapon5': '0.272', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon2': '0.662', 'weapon3': '0.922', 'DAMAGECOUNT': '1.330'} +[2023-09-14 12:31:50,024][53806] DAMAGECOUNT value on done: 323.0 +[2023-09-14 12:31:50,024][53806] Sum rewards: 2.934, reward structure: {'HEALTH': '-1.850', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.014', 'weapon4': '0.022', 'AMMO3': '0.030', 'AMMO4': '0.068', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.238', 'WEAPON3': '0.300', 'weapon2': '0.376', 'FRAGCOUNT': '0.999', 'weapon3': '1.262', 'DAMAGECOUNT': '2.170'} +[2023-09-14 12:31:50,025][53806] DAMAGECOUNT value on done: 105.0 +[2023-09-14 12:31:50,144][53811] DAMAGECOUNT value on done: 200.0 +[2023-09-14 12:31:50,144][53811] DAMAGECOUNT value on done: 311.0 +[2023-09-14 12:31:50,145][53811] Sum rewards: 2.554, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.021', 'AMMO3': '0.052', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO4': '0.104', 'weapon5': '0.108', 'weapon4': '0.262', 'WEAPON3': '0.300', 'weapon3': '0.540', 'weapon2': '0.614', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.350'} +[2023-09-14 12:31:50,145][53811] Sum rewards: 2.457, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'AMMO4': '-0.033', 'AMMO2': '-0.007', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.034', 'WEAPON5': '0.100', 'WEAPON3': '0.300', 'weapon5': '0.372', 'weapon2': '0.490', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '1.146'} +[2023-09-14 12:31:50,420][53808] DAMAGECOUNT value on done: 218.0 +[2023-09-14 12:31:50,420][53808] DAMAGECOUNT value on done: 70.0 +[2023-09-14 12:31:50,602][53805] DAMAGECOUNT value on done: 78.0 +[2023-09-14 12:31:50,602][53805] DAMAGECOUNT value on done: 70.0 +[2023-09-14 12:31:50,603][53805] Sum rewards: 0.475, reward structure: {'HEALTH': '-1.720', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.015', 'AMMO2': '-0.003', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.046', 'WEAPON5': '0.200', 'WEAPON3': '0.300', 'weapon5': '0.320', 'weapon2': '0.646', 'DAMAGECOUNT': '0.700', 'weapon3': '0.994'} +[2023-09-14 12:31:50,895][53806] DAMAGECOUNT value on done: 220.0 +[2023-09-14 12:31:50,895][53806] DAMAGECOUNT value on done: 110.0 +[2023-09-14 12:31:50,965][53811] DAMAGECOUNT value on done: 117.0 +[2023-09-14 12:31:50,966][53811] DAMAGECOUNT value on done: 170.0 +[2023-09-14 12:31:52,435][109198] Fps is (10 sec: 10649.6, 60 sec: 13107.2, 300 sec: 11878.4). Total num frames: 3821568. Throughput: 0: 2094.4, 1: 1145.0. Samples: 266440. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:31:52,436][109198] Avg episode reward: [(0, '2.894'), (1, '0.918')] +[2023-09-14 12:31:53,700][53801] Updated weights for policy 0, policy_version 832 (0.0033) +[2023-09-14 12:31:53,929][53809] DAMAGECOUNT value on done: 195.0 +[2023-09-14 12:31:53,929][53809] DAMAGECOUNT value on done: 458.0 +[2023-09-14 12:31:53,931][53809] Sum rewards: -1.503, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.035', 'weapon5': '0.052', 'weapon4': '0.090', 'AMMO3': '0.100', 'AMMO4': '0.173', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.900', 'weapon2': '0.958', 'weapon3': '1.180'} +[2023-09-14 12:31:53,932][53809] Sum rewards: 6.235, reward structure: {'HEALTH': '-0.900', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'weapon2': '0.046', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.346', 'weapon5': '0.850', 'weapon3': '1.340', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.100'} +[2023-09-14 12:31:54,459][53810] DAMAGECOUNT value on done: 227.0 +[2023-09-14 12:31:54,460][53810] Sum rewards: 1.562, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.012', 'AMMO5': '0.014', 'AMMO4': '0.061', 'WEAPON4': '0.100', 'AMMO3': '0.106', 'weapon5': '0.126', 'WEAPON5': '0.300', 'weapon4': '0.348', 'WEAPON3': '0.600', 'weapon2': '0.730', 'weapon3': '0.846', 'FRAGCOUNT': '0.998', 'DAMAGECOUNT': '1.320'} +[2023-09-14 12:31:54,460][53810] DAMAGECOUNT value on done: 190.0 +[2023-09-14 12:31:54,628][53809] DAMAGECOUNT value on done: 88.0 +[2023-09-14 12:31:54,628][53809] DAMAGECOUNT value on done: 22.0 +[2023-09-14 12:31:54,630][53809] Sum rewards: 0.509, reward structure: {'HEALTH': '-1.170', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.028', 'AMMO2': '-0.006', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO3': '0.046', 'WEAPON5': '0.100', 'weapon5': '0.180', 'DAMAGECOUNT': '0.280', 'WEAPON3': '0.300', 'weapon2': '0.896', 'weapon3': '0.908'} +[2023-09-14 12:31:55,211][53809] DAMAGECOUNT value on done: 75.0 +[2023-09-14 12:31:55,211][53809] DAMAGECOUNT value on done: 220.0 +[2023-09-14 12:31:55,253][53810] DAMAGECOUNT value on done: 160.0 +[2023-09-14 12:31:55,253][53810] DAMAGECOUNT value on done: 316.0 +[2023-09-14 12:31:55,254][53810] Sum rewards: 2.256, reward structure: {'HEALTH': '-2.750', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'weapon5': '0.008', 'AMMO5': '0.015', 'AMMO2': '0.017', 'AMMO3': '0.054', 'AMMO4': '0.085', 'WEAPON4': '0.100', 'weapon4': '0.156', 'WEAPON5': '0.300', 'WEAPON3': '0.500', 'weapon2': '0.576', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.600', 'weapon3': '2.594'} +[2023-09-14 12:31:55,254][53810] Sum rewards: 6.352, reward structure: {'HEALTH': '-1.500', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.007', 'AMMO4': '0.025', 'AMMO3': '0.044', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.262', 'weapon4': '0.264', 'weapon2': '0.276', 'WEAPON3': '0.400', 'FRAGCOUNT': '2.000', 'weapon3': '2.368', 'DAMAGECOUNT': '2.900'} +[2023-09-14 12:31:55,763][53810] DAMAGECOUNT value on done: 124.0 +[2023-09-14 12:31:55,763][53810] DAMAGECOUNT value on done: 97.0 +[2023-09-14 12:31:55,764][53810] Sum rewards: 1.753, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.029', 'AMMO3': '0.030', 'WEAPON5': '0.100', 'weapon5': '0.140', 'AMMO4': '0.146', 'WEAPON3': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.546', 'weapon2': '0.558', 'weapon3': '0.830', 'DAMAGECOUNT': '0.970'} +[2023-09-14 12:31:55,971][53802] Updated weights for policy 1, policy_version 110 (0.0012) +[2023-09-14 12:31:55,984][53809] DAMAGECOUNT value on done: 60.0 +[2023-09-14 12:31:55,985][53809] DAMAGECOUNT value on done: 15.0 +[2023-09-14 12:31:55,985][53809] Sum rewards: 0.670, reward structure: {'HEALTH': '-1.450', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.009', 'AMMO2': '0.037', 'weapon4': '0.046', 'AMMO3': '0.058', 'weapon5': '0.086', 'AMMO4': '0.185', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.636', 'weapon3': '1.264'} +[2023-09-14 12:31:56,363][53810] DAMAGECOUNT value on done: 203.0 +[2023-09-14 12:31:56,363][53810] DAMAGECOUNT value on done: 118.0 +[2023-09-14 12:31:56,363][53810] Sum rewards: 5.111, reward structure: {'HEALTH': '-0.100', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.010', 'AMMO3': '0.020', 'AMMO4': '0.050', 'weapon2': '0.072', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.418', 'weapon5': '0.436', 'FRAGCOUNT': '1.000', 'weapon3': '1.292', 'DAMAGECOUNT': '1.510'} +[2023-09-14 12:31:56,814][53804] DAMAGECOUNT value on done: 115.0 +[2023-09-14 12:31:56,815][53804] DAMAGECOUNT value on done: 95.0 +[2023-09-14 12:31:57,435][109198] Fps is (10 sec: 11878.5, 60 sec: 13107.2, 300 sec: 11943.1). Total num frames: 3887104. Throughput: 0: 2058.5, 1: 1143.3. Samples: 275145. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:31:57,436][109198] Avg episode reward: [(0, '2.917'), (1, '0.967')] +[2023-09-14 12:31:57,614][53804] DAMAGECOUNT value on done: 50.0 +[2023-09-14 12:31:57,614][53804] DAMAGECOUNT value on done: 284.0 +[2023-09-14 12:31:57,615][53804] Sum rewards: 4.045, reward structure: {'HEALTH': '-0.900', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'weapon2': '0.026', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.122', 'WEAPON3': '0.200', 'weapon4': '0.354', 'FRAGCOUNT': '1.000', 'weapon3': '1.200', 'DAMAGECOUNT': '1.790'} +[2023-09-14 12:31:58,409][53804] DAMAGECOUNT value on done: 292.0 +[2023-09-14 12:31:58,409][53804] DAMAGECOUNT value on done: 367.0 +[2023-09-14 12:31:58,411][53804] Sum rewards: 3.506, reward structure: {'HEALTH': '-2.150', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.006', 'AMMO5': '0.013', 'AMMO4': '0.028', 'AMMO3': '0.052', 'WEAPON5': '0.300', 'weapon2': '0.420', 'WEAPON3': '0.500', 'weapon5': '0.512', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '2.060', 'weapon3': '2.766'} +[2023-09-14 12:31:59,119][53804] DAMAGECOUNT value on done: 200.0 +[2023-09-14 12:31:59,120][53804] DAMAGECOUNT value on done: 374.0 +[2023-09-14 12:31:59,120][53804] Sum rewards: 6.678, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'AMMO4': '-0.022', 'AMMO2': '-0.004', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'weapon4': '0.100', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.678', 'weapon5': '0.932', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.000', 'weapon3': '2.248'} +[2023-09-14 12:32:00,253][53801] Updated weights for policy 0, policy_version 842 (0.0016) +[2023-09-14 12:32:02,435][109198] Fps is (10 sec: 12697.7, 60 sec: 13038.9, 300 sec: 11960.4). Total num frames: 3948544. Throughput: 0: 1948.4, 1: 1183.2. Samples: 293687. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:32:02,436][109198] Avg episode reward: [(0, '2.968'), (1, '0.923')] +[2023-09-14 12:32:02,502][53802] Updated weights for policy 1, policy_version 120 (0.0014) +[2023-09-14 12:32:06,541][53801] Updated weights for policy 0, policy_version 852 (0.0014) +[2023-09-14 12:32:07,435][109198] Fps is (10 sec: 13107.2, 60 sec: 12970.7, 300 sec: 12054.0). Total num frames: 4018176. Throughput: 0: 1877.5, 1: 1265.2. Samples: 313839. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:32:07,436][109198] Avg episode reward: [(0, '2.968'), (1, '0.923')] +[2023-09-14 12:32:08,142][53802] Updated weights for policy 1, policy_version 130 (0.0013) +[2023-09-14 12:32:12,435][109198] Fps is (10 sec: 13926.3, 60 sec: 12970.7, 300 sec: 12139.1). Total num frames: 4087808. Throughput: 0: 1849.8, 1: 1312.2. Samples: 324179. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:32:12,436][109198] Avg episode reward: [(0, '2.968'), (1, '0.923')] +[2023-09-14 12:32:12,441][53511] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000861_3526656.pth... +[2023-09-14 12:32:12,441][53585] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000137_561152.pth... +[2023-09-14 12:32:12,504][53511] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000603_2469888.pth +[2023-09-14 12:32:12,613][53801] Updated weights for policy 0, policy_version 862 (0.0015) +[2023-09-14 12:32:13,717][53802] Updated weights for policy 1, policy_version 140 (0.0013) +[2023-09-14 12:32:17,435][109198] Fps is (10 sec: 14336.0, 60 sec: 12902.4, 300 sec: 12252.4). Total num frames: 4161536. Throughput: 0: 1798.9, 1: 1412.4. Samples: 345703. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:32:17,437][109198] Avg episode reward: [(0, '2.968'), (1, '0.923')] +[2023-09-14 12:32:18,499][53801] Updated weights for policy 0, policy_version 872 (0.0013) +[2023-09-14 12:32:19,220][53802] Updated weights for policy 1, policy_version 150 (0.0012) +[2023-09-14 12:32:22,435][109198] Fps is (10 sec: 14335.8, 60 sec: 13038.9, 300 sec: 12322.1). Total num frames: 4231168. Throughput: 0: 1724.8, 1: 1497.4. Samples: 367235. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:32:22,437][109198] Avg episode reward: [(0, '2.968'), (1, '0.923')] +[2023-09-14 12:32:23,066][53811] DAMAGECOUNT value on done: 253.0 +[2023-09-14 12:32:23,066][53811] DAMAGECOUNT value on done: 243.0 +[2023-09-14 12:32:23,067][53811] Sum rewards: 1.431, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.020', 'AMMO3': '0.063', 'WEAPON5': '0.100', 'AMMO4': '0.101', 'weapon5': '0.168', 'DAMAGECOUNT': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.246', 'WEAPON3': '0.400', 'weapon2': '0.800', 'weapon3': '1.130'} +[2023-09-14 12:32:23,423][53805] DAMAGECOUNT value on done: 48.0 +[2023-09-14 12:32:23,424][53805] DAMAGECOUNT value on done: 230.0 +[2023-09-14 12:32:23,424][53805] Sum rewards: 4.681, reward structure: {'HEALTH': '-0.600', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'weapon5': '0.122', 'WEAPON3': '0.200', 'weapon2': '0.720', 'FRAGCOUNT': '1.000', 'weapon3': '1.066', 'DAMAGECOUNT': '2.050'} +[2023-09-14 12:32:23,606][53811] DAMAGECOUNT value on done: 208.0 +[2023-09-14 12:32:23,606][53811] DAMAGECOUNT value on done: 272.0 +[2023-09-14 12:32:23,959][53805] DAMAGECOUNT value on done: 370.0 +[2023-09-14 12:32:23,959][53805] DAMAGECOUNT value on done: 245.0 +[2023-09-14 12:32:23,959][53805] Sum rewards: 3.422, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.010', 'AMMO3': '0.037', 'AMMO4': '0.050', 'weapon2': '0.090', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.174', 'WEAPON3': '0.300', 'weapon4': '0.446', 'FRAGCOUNT': '1.000', 'weapon3': '1.262', 'DAMAGECOUNT': '1.850'} +[2023-09-14 12:32:23,960][53805] Sum rewards: 2.606, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.007', 'AMMO5': '0.014', 'AMMO4': '0.033', 'AMMO3': '0.059', 'weapon5': '0.168', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.424', 'weapon2': '0.428', 'WEAPON3': '0.500', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '2.424'} +[2023-09-14 12:32:24,259][53801] Updated weights for policy 0, policy_version 882 (0.0013) +[2023-09-14 12:32:24,815][53802] Updated weights for policy 1, policy_version 160 (0.0013) +[2023-09-14 12:32:26,552][53807] DAMAGECOUNT value on done: 168.0 +[2023-09-14 12:32:26,553][53807] DAMAGECOUNT value on done: 35.0 +[2023-09-14 12:32:26,553][53807] Sum rewards: 4.560, reward structure: {'HEALTH': '-0.500', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'weapon2': '0.006', 'AMMO3': '0.019', 'AMMO4': '0.025', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.334', 'weapon5': '0.334', 'FRAGCOUNT': '1.000', 'weapon3': '1.254', 'DAMAGECOUNT': '1.680'} +[2023-09-14 12:32:26,554][53807] Sum rewards: -0.299, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.020', 'weapon5': '0.034', 'AMMO3': '0.052', 'AMMO4': '0.098', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.350', 'weapon3': '0.526', 'weapon4': '0.720', 'weapon2': '1.296'} +[2023-09-14 12:32:26,925][53811] Large shaping reward 2.602 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 1.0), ('DAMAGECOUNT', 1.6, 160.0), ('weapon5', 0.002)] +[2023-09-14 12:32:27,068][53807] DAMAGECOUNT value on done: 105.0 +[2023-09-14 12:32:27,068][53807] DAMAGECOUNT value on done: 321.0 +[2023-09-14 12:32:27,435][109198] Fps is (10 sec: 14336.0, 60 sec: 13243.7, 300 sec: 12419.1). Total num frames: 4304896. Throughput: 0: 1698.0, 1: 1553.1. Samples: 378331. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:32:27,437][109198] Avg episode reward: [(0, '2.982'), (1, '0.956')] +[2023-09-14 12:32:27,513][53807] DAMAGECOUNT value on done: 65.0 +[2023-09-14 12:32:27,513][53807] DAMAGECOUNT value on done: 203.0 +[2023-09-14 12:32:27,514][53807] Sum rewards: 0.422, reward structure: {'HEALTH': '-1.970', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.011', 'AMMO4': '0.056', 'AMMO3': '0.063', 'WEAPON4': '0.100', 'weapon4': '0.142', 'weapon5': '0.174', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.500', 'weapon2': '0.830', 'weapon3': '0.908'} +[2023-09-14 12:32:28,085][53807] DAMAGECOUNT value on done: 615.0 +[2023-09-14 12:32:28,085][53807] DAMAGECOUNT value on done: 437.0 +[2023-09-14 12:32:28,085][53807] Sum rewards: 4.640, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.015', 'AMMO2': '-0.003', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO3': '0.063', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.200', 'weapon5': '0.266', 'WEAPON3': '0.500', 'weapon2': '1.060', 'FRAGCOUNT': '1.998', 'DAMAGECOUNT': '2.000', 'weapon3': '2.262'} +[2023-09-14 12:32:28,122][53808] DAMAGECOUNT value on done: 165.0 +[2023-09-14 12:32:28,122][53808] DAMAGECOUNT value on done: 266.0 +[2023-09-14 12:32:28,123][53808] Sum rewards: 4.347, reward structure: {'HEALTH': '-0.600', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'weapon5': '0.078', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.716', 'FRAGCOUNT': '1.000', 'weapon3': '1.080', 'DAMAGECOUNT': '1.750'} +[2023-09-14 12:32:28,700][53808] DAMAGECOUNT value on done: 284.0 +[2023-09-14 12:32:28,701][53808] DAMAGECOUNT value on done: 235.0 +[2023-09-14 12:32:28,701][53808] Sum rewards: 3.533, reward structure: {'HEALTH': '-0.820', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.352', 'weapon5': '0.420', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.070', 'weapon3': '1.218'} +[2023-09-14 12:32:28,784][53806] DAMAGECOUNT value on done: 310.0 +[2023-09-14 12:32:28,785][53806] DAMAGECOUNT value on done: 146.0 +[2023-09-14 12:32:28,797][53805] DAMAGECOUNT value on done: 193.0 +[2023-09-14 12:32:28,798][53805] DAMAGECOUNT value on done: 320.0 +[2023-09-14 12:32:28,798][53805] Sum rewards: 0.351, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO2': '0.029', 'AMMO3': '0.089', 'AMMO4': '0.144', 'weapon5': '0.154', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.302', 'WEAPON3': '0.500', 'weapon3': '0.654', 'weapon2': '0.766', 'FRAGCOUNT': '0.999'} +[2023-09-14 12:32:28,799][53805] Sum rewards: 3.662, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO4': '0.024', 'AMMO3': '0.030', 'WEAPON5': '0.100', 'weapon5': '0.136', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.334', 'weapon4': '0.508', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.450', 'weapon3': '1.622'} +[2023-09-14 12:32:29,259][53808] DAMAGECOUNT value on done: 220.0 +[2023-09-14 12:32:29,259][53808] DAMAGECOUNT value on done: 99.0 +[2023-09-14 12:32:29,260][53808] Sum rewards: 0.883, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.004', 'AMMO4': '0.019', 'AMMO3': '0.037', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.100', 'WEAPON4': '0.100', 'weapon5': '0.144', 'WEAPON3': '0.300', 'weapon2': '0.856', 'weapon3': '1.270'} +[2023-09-14 12:32:29,260][53808] Sum rewards: 1.630, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO3': '0.022', 'AMMO2': '0.025', 'WEAPON5': '0.100', 'AMMO4': '0.124', 'weapon5': '0.156', 'WEAPON4': '0.200', 'WEAPON3': '0.200', 'weapon4': '0.418', 'DAMAGECOUNT': '0.500', 'weapon2': '0.970', 'weapon3': '1.012'} +[2023-09-14 12:32:29,338][53811] DAMAGECOUNT value on done: 451.0 +[2023-09-14 12:32:29,338][53811] DAMAGECOUNT value on done: 516.0 +[2023-09-14 12:32:29,339][53811] Sum rewards: 4.354, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.003', 'AMMO4': '0.013', 'AMMO5': '0.014', 'AMMO3': '0.064', 'WEAPON4': '0.100', 'weapon5': '0.110', 'weapon2': '0.230', 'WEAPON5': '0.300', 'weapon4': '0.336', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '2.510', 'weapon3': '3.074'} +[2023-09-14 12:32:29,339][53811] Sum rewards: 3.594, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.057', 'AMMO2': '-0.011', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO3': '0.063', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON6': '0.200', 'weapon5': '0.228', 'WEAPON5': '0.300', 'weapon6': '0.354', 'WEAPON3': '0.500', 'weapon2': '0.850', 'FRAGCOUNT': '1.000', 'weapon3': '1.902', 'DAMAGECOUNT': '2.050'} +[2023-09-14 12:32:29,346][53806] DAMAGECOUNT value on done: 220.0 +[2023-09-14 12:32:29,346][53806] DAMAGECOUNT value on done: 95.0 +[2023-09-14 12:32:29,347][53806] Sum rewards: 2.782, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.017', 'AMMO3': '0.039', 'AMMO4': '0.085', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon5': '0.270', 'WEAPON3': '0.300', 'weapon2': '0.540', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.328'} +[2023-09-14 12:32:29,348][53806] Sum rewards: 2.760, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.006', 'AMMO4': '0.030', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'weapon4': '0.246', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.950', 'weapon2': '0.976', 'FRAGCOUNT': '1.000', 'weapon3': '1.112'} +[2023-09-14 12:32:29,370][53805] DAMAGECOUNT value on done: 298.0 +[2023-09-14 12:32:29,371][53805] DAMAGECOUNT value on done: 150.0 +[2023-09-14 12:32:29,371][53805] Sum rewards: 6.434, reward structure: {'HEALTH': '-1.300', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.050', 'weapon2': '0.088', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon5': '0.246', 'WEAPON3': '0.400', 'weapon4': '0.628', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.200', 'weapon3': '2.664'} +[2023-09-14 12:32:29,834][53808] DAMAGECOUNT value on done: 308.0 +[2023-09-14 12:32:29,835][53808] DAMAGECOUNT value on done: 365.0 +[2023-09-14 12:32:29,835][53808] Sum rewards: 7.432, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.009', 'AMMO4': '0.027', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.220', 'weapon2': '0.384', 'WEAPON3': '0.400', 'weapon4': '0.456', 'FRAGCOUNT': '1.999', 'weapon3': '2.642', 'DAMAGECOUNT': '2.950'} +[2023-09-14 12:32:29,942][53811] DAMAGECOUNT value on done: 360.0 +[2023-09-14 12:32:29,942][53811] DAMAGECOUNT value on done: 305.0 +[2023-09-14 12:32:29,943][53811] Sum rewards: 4.898, reward structure: {'HEALTH': '-1.180', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.011', 'weapon5': '0.052', 'AMMO4': '0.055', 'AMMO3': '0.060', 'weapon4': '0.182', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.782', 'weapon3': '1.226', 'DAMAGECOUNT': '1.900', 'FRAGCOUNT': '2.000'} +[2023-09-14 12:32:29,944][53811] Sum rewards: 2.472, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.012', 'weapon2': '0.036', 'AMMO3': '0.046', 'AMMO4': '0.058', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.300', 'WEAPON3': '0.400', 'weapon4': '0.438', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.880', 'weapon3': '1.894'} +[2023-09-14 12:32:29,970][53806] DAMAGECOUNT value on done: 343.0 +[2023-09-14 12:32:29,970][53806] DAMAGECOUNT value on done: 155.0 +[2023-09-14 12:32:29,971][53806] Sum rewards: 1.641, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'weapon5': '0.062', 'WEAPON5': '0.200', 'weapon2': '0.352', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.500', 'weapon3': '2.308'} +[2023-09-14 12:32:30,068][53801] Updated weights for policy 0, policy_version 892 (0.0012) +[2023-09-14 12:32:30,207][53802] Updated weights for policy 1, policy_version 170 (0.0013) +[2023-09-14 12:32:30,535][53806] DAMAGECOUNT value on done: 170.0 +[2023-09-14 12:32:30,535][53806] DAMAGECOUNT value on done: 240.0 +[2023-09-14 12:32:32,435][109198] Fps is (10 sec: 15155.5, 60 sec: 13380.3, 300 sec: 12540.1). Total num frames: 4382720. Throughput: 0: 1673.0, 1: 1660.6. Samples: 400212. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:32:32,437][109198] Avg episode reward: [(0, '3.016'), (1, '1.155')] +[2023-09-14 12:32:32,441][53585] Saving new best policy, reward=1.155! +[2023-09-14 12:32:32,476][53809] DAMAGECOUNT value on done: 468.0 +[2023-09-14 12:32:32,476][53809] DAMAGECOUNT value on done: 200.0 +[2023-09-14 12:32:33,002][53809] DAMAGECOUNT value on done: 37.0 +[2023-09-14 12:32:33,002][53809] DAMAGECOUNT value on done: 103.0 +[2023-09-14 12:32:33,003][53809] Sum rewards: 0.854, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.031', 'AMMO2': '0.038', 'weapon5': '0.128', 'DAMAGECOUNT': '0.150', 'AMMO4': '0.188', 'WEAPON3': '0.200', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.318', 'weapon3': '0.550', 'weapon2': '0.942'} +[2023-09-14 12:32:33,003][53809] Sum rewards: 2.736, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.010', 'weapon2': '0.022', 'AMMO4': '0.025', 'AMMO3': '0.040', 'DAMAGECOUNT': '0.150', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.558', 'weapon5': '0.810', 'weapon3': '2.468'} +[2023-09-14 12:32:33,471][53809] DAMAGECOUNT value on done: 235.0 +[2023-09-14 12:32:33,471][53809] DAMAGECOUNT value on done: 276.0 +[2023-09-14 12:32:33,472][53809] Sum rewards: 5.135, reward structure: {'HEALTH': '-0.150', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'weapon5': '0.090', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon2': '0.102', 'WEAPON3': '0.200', 'weapon4': '0.330', 'FRAGCOUNT': '1.000', 'weapon3': '1.300', 'DAMAGECOUNT': '2.010'} +[2023-09-14 12:32:33,703][53810] DAMAGECOUNT value on done: 205.0 +[2023-09-14 12:32:33,703][53810] DAMAGECOUNT value on done: 227.0 +[2023-09-14 12:32:33,704][53810] Sum rewards: 0.215, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.004', 'AMMO2': '0.004', 'AMMO4': '0.021', 'AMMO3': '0.027', 'weapon5': '0.082', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.480', 'weapon4': '0.590', 'weapon3': '0.758'} +[2023-09-14 12:32:34,015][53809] DAMAGECOUNT value on done: 55.0 +[2023-09-14 12:32:34,016][53809] DAMAGECOUNT value on done: 90.0 +[2023-09-14 12:32:34,016][53809] Sum rewards: 2.578, reward structure: {'HEALTH': '-1.300', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.014', 'AMMO3': '0.040', 'AMMO4': '0.068', 'WEAPON4': '0.100', 'weapon5': '0.134', 'WEAPON5': '0.200', 'weapon4': '0.250', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.400', 'weapon2': '0.490', 'weapon3': '2.774'} +[2023-09-14 12:32:34,263][53810] DAMAGECOUNT value on done: 320.0 +[2023-09-14 12:32:34,263][53810] Sum rewards: 3.223, reward structure: {'HEALTH': '-1.180', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.009', 'AMMO3': '0.042', 'AMMO4': '0.045', 'weapon5': '0.098', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.224', 'WEAPON3': '0.300', 'weapon2': '0.838', 'FRAGCOUNT': '1.000', 'weapon3': '1.042', 'DAMAGECOUNT': '1.600'} +[2023-09-14 12:32:34,264][53810] DAMAGECOUNT value on done: 415.0 +[2023-09-14 12:32:34,264][53810] Sum rewards: 2.615, reward structure: {'HEALTH': '-1.600', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.007', 'AMMO4': '0.025', 'AMMO3': '0.049', 'weapon5': '0.082', 'weapon2': '0.098', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.310', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.990', 'FRAGCOUNT': '1.000', 'weapon3': '1.948'} +[2023-09-14 12:32:34,849][53810] DAMAGECOUNT value on done: 234.0 +[2023-09-14 12:32:34,849][53810] DAMAGECOUNT value on done: 97.0 +[2023-09-14 12:32:34,850][53810] Sum rewards: 4.768, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.010', 'weapon2': '0.034', 'AMMO3': '0.040', 'AMMO4': '0.050', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.254', 'WEAPON3': '0.400', 'weapon4': '0.632', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.100', 'weapon3': '2.842'} +[2023-09-14 12:32:34,850][53810] Sum rewards: -0.338, reward structure: {'HEALTH': '-2.050', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.009', 'AMMO2': '0.036', 'weapon5': '0.058', 'AMMO3': '0.062', 'AMMO4': '0.179', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.418', 'weapon2': '1.066', 'weapon3': '1.084'} +[2023-09-14 12:32:35,483][53810] DAMAGECOUNT value on done: 118.0 +[2023-09-14 12:32:35,484][53810] Sum rewards: 0.967, reward structure: {'HEALTH': '-1.300', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.039', 'AMMO2': '-0.008', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.008', 'AMMO3': '0.050', 'weapon5': '0.164', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.896', 'weapon3': '1.596'} +[2023-09-14 12:32:35,484][53810] DAMAGECOUNT value on done: 283.0 +[2023-09-14 12:32:35,485][53810] Sum rewards: 0.565, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'FRAGCOUNT': '-0.002', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.046', 'weapon5': '0.080', 'AMMO3': '0.083', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'AMMO4': '0.228', 'weapon4': '0.436', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.800', 'weapon2': '0.946', 'weapon3': '1.038'} +[2023-09-14 12:32:35,665][53802] Updated weights for policy 1, policy_version 180 (0.0013) +[2023-09-14 12:32:35,872][53801] Updated weights for policy 0, policy_version 902 (0.0012) +[2023-09-14 12:32:36,891][53804] DAMAGECOUNT value on done: 125.0 +[2023-09-14 12:32:36,893][53804] DAMAGECOUNT value on done: 140.0 +[2023-09-14 12:32:36,894][53804] Sum rewards: 2.693, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.019', 'AMMO3': '0.040', 'AMMO4': '0.095', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.246', 'DAMAGECOUNT': '0.250', 'weapon2': '0.370', 'WEAPON3': '0.400', 'weapon5': '0.430', 'weapon3': '2.586'} +[2023-09-14 12:32:37,435][109198] Fps is (10 sec: 14745.6, 60 sec: 13380.3, 300 sec: 12591.4). Total num frames: 4452352. Throughput: 0: 1690.9, 1: 1763.8. Samples: 421902. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:32:37,437][109198] Avg episode reward: [(0, '3.061'), (1, '1.196')] +[2023-09-14 12:32:37,438][53585] Saving new best policy, reward=1.196! +[2023-09-14 12:32:37,650][53804] DAMAGECOUNT value on done: 125.0 +[2023-09-14 12:32:37,651][53804] Sum rewards: 1.586, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'FRAGCOUNT': '-0.002', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.018', 'AMMO3': '0.073', 'AMMO4': '0.090', 'weapon5': '0.124', 'weapon2': '0.166', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.246', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.750', 'weapon3': '3.114'} +[2023-09-14 12:32:37,651][53804] DAMAGECOUNT value on done: 284.0 +[2023-09-14 12:32:37,651][53804] Sum rewards: 0.934, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.004', 'AMMO2': '0.011', 'AMMO4': '0.053', 'AMMO3': '0.069', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.222', 'weapon4': '0.266', 'WEAPON3': '0.400', 'weapon3': '0.742', 'weapon2': '0.968'} +[2023-09-14 12:32:38,360][53804] DAMAGECOUNT value on done: 567.0 +[2023-09-14 12:32:38,360][53804] DAMAGECOUNT value on done: 582.0 +[2023-09-14 12:32:38,360][53804] Sum rewards: 3.674, reward structure: {'HEALTH': '-2.500', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.009', 'AMMO4': '0.047', 'weapon5': '0.058', 'AMMO3': '0.060', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.360', 'weapon2': '0.436', 'WEAPON3': '0.500', 'DAMAGECOUNT': '2.000', 'FRAGCOUNT': '2.000', 'weapon3': '2.296'} +[2023-09-14 12:32:38,361][53804] Sum rewards: 4.715, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.011', 'AMMO5': '0.013', 'weapon4': '0.044', 'AMMO4': '0.055', 'AMMO3': '0.070', 'WEAPON4': '0.100', 'weapon5': '0.232', 'WEAPON5': '0.300', 'WEAPON3': '0.500', 'weapon2': '0.582', 'weapon3': '1.908', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.900'} +[2023-09-14 12:32:38,952][53804] DAMAGECOUNT value on done: 225.0 +[2023-09-14 12:32:38,953][53804] DAMAGECOUNT value on done: 530.0 +[2023-09-14 12:32:38,953][53804] Sum rewards: 4.637, reward structure: {'HEALTH': '-0.250', 'AMMO4': '-0.000', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'weapon5': '0.074', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.732', 'FRAGCOUNT': '1.000', 'weapon3': '1.198', 'DAMAGECOUNT': '1.560'} +[2023-09-14 12:32:41,550][53802] Updated weights for policy 1, policy_version 190 (0.0012) +[2023-09-14 12:32:42,153][53801] Updated weights for policy 0, policy_version 912 (0.0013) +[2023-09-14 12:32:42,435][109198] Fps is (10 sec: 13516.7, 60 sec: 13380.3, 300 sec: 12609.8). Total num frames: 4517888. Throughput: 0: 1689.2, 1: 1785.4. Samples: 431505. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:32:42,437][109198] Avg episode reward: [(0, '3.094'), (1, '1.186')] +[2023-09-14 12:32:47,435][109198] Fps is (10 sec: 13107.1, 60 sec: 13585.1, 300 sec: 12627.0). Total num frames: 4583424. Throughput: 0: 1697.6, 1: 1801.1. Samples: 451130. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:32:47,436][109198] Avg episode reward: [(0, '3.094'), (1, '1.186')] +[2023-09-14 12:32:47,604][53802] Updated weights for policy 1, policy_version 200 (0.0012) +[2023-09-14 12:32:48,483][53801] Updated weights for policy 0, policy_version 922 (0.0014) +[2023-09-14 12:32:52,435][109198] Fps is (10 sec: 13516.9, 60 sec: 13858.1, 300 sec: 12670.3). Total num frames: 4653056. Throughput: 0: 1706.6, 1: 1812.9. Samples: 472214. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:32:52,436][109198] Avg episode reward: [(0, '3.094'), (1, '1.186')] +[2023-09-14 12:32:53,404][53802] Updated weights for policy 1, policy_version 210 (0.0012) +[2023-09-14 12:32:54,559][53801] Updated weights for policy 0, policy_version 932 (0.0013) +[2023-09-14 12:32:57,435][109198] Fps is (10 sec: 13926.5, 60 sec: 13926.4, 300 sec: 12710.8). Total num frames: 4722688. Throughput: 0: 1709.3, 1: 1814.0. Samples: 482730. Policy #0 lag: (min: 0.0, avg: 0.7, max: 3.0) +[2023-09-14 12:32:57,437][109198] Avg episode reward: [(0, '3.094'), (1, '1.186')] +[2023-09-14 12:32:59,265][53802] Updated weights for policy 1, policy_version 220 (0.0012) +[2023-09-14 12:33:00,796][53801] Updated weights for policy 0, policy_version 942 (0.0013) +[2023-09-14 12:33:01,216][53805] DAMAGECOUNT value on done: 83.0 +[2023-09-14 12:33:01,217][53805] DAMAGECOUNT value on done: 399.0 +[2023-09-14 12:33:01,218][53805] Sum rewards: 4.587, reward structure: {'HEALTH': '-0.640', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.104', 'WEAPON3': '0.200', 'weapon2': '0.394', 'weapon5': '0.408', 'FRAGCOUNT': '1.000', 'weapon3': '1.208', 'DAMAGECOUNT': '1.690'} +[2023-09-14 12:33:01,259][53811] DAMAGECOUNT value on done: 585.0 +[2023-09-14 12:33:01,260][53811] DAMAGECOUNT value on done: 388.0 +[2023-09-14 12:33:01,260][53811] Sum rewards: 5.067, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.006', 'AMMO5': '0.012', 'AMMO4': '0.032', 'AMMO3': '0.072', 'weapon5': '0.288', 'WEAPON5': '0.300', 'weapon2': '0.412', 'WEAPON3': '0.600', 'weapon3': '2.926', 'FRAGCOUNT': '2.998', 'DAMAGECOUNT': '3.420'} +[2023-09-14 12:33:01,261][53811] Sum rewards: 0.507, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.013', 'AMMO4': '0.064', 'weapon5': '0.068', 'AMMO3': '0.099', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.286', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.186', 'DAMAGECOUNT': '1.350', 'weapon2': '1.430'} +[2023-09-14 12:33:01,828][53811] DAMAGECOUNT value on done: 268.0 +[2023-09-14 12:33:01,828][53811] DAMAGECOUNT value on done: 351.0 +[2023-09-14 12:33:01,836][53805] DAMAGECOUNT value on done: 545.0 +[2023-09-14 12:33:01,836][53805] DAMAGECOUNT value on done: 362.0 +[2023-09-14 12:33:02,435][109198] Fps is (10 sec: 13516.8, 60 sec: 13994.7, 300 sec: 12723.2). Total num frames: 4788224. Throughput: 0: 1698.6, 1: 1797.8. Samples: 503043. Policy #0 lag: (min: 0.0, avg: 0.6, max: 1.0) +[2023-09-14 12:33:02,436][109198] Avg episode reward: [(0, '3.115'), (1, '1.203')] +[2023-09-14 12:33:02,443][53585] Saving new best policy, reward=1.203! +[2023-09-14 12:33:04,683][53807] DAMAGECOUNT value on done: 168.0 +[2023-09-14 12:33:04,683][53807] DAMAGECOUNT value on done: 80.0 +[2023-09-14 12:33:04,684][53807] Sum rewards: 1.941, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.021', 'AMMO3': '0.046', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.106', 'weapon5': '0.148', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.450', 'weapon4': '0.506', 'weapon3': '0.870', 'weapon2': '1.290'} +[2023-09-14 12:33:04,855][53802] Updated weights for policy 1, policy_version 230 (0.0012) +[2023-09-14 12:33:05,202][53807] DAMAGECOUNT value on done: 307.0 +[2023-09-14 12:33:05,202][53807] DAMAGECOUNT value on done: 484.0 +[2023-09-14 12:33:05,203][53807] Sum rewards: 1.718, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.003', 'AMMO5': '0.012', 'AMMO4': '0.016', 'AMMO3': '0.079', 'WEAPON4': '0.100', 'weapon4': '0.160', 'WEAPON5': '0.300', 'weapon5': '0.308', 'WEAPON3': '0.600', 'weapon2': '0.786', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '2.020', 'weapon3': '2.334'} +[2023-09-14 12:33:05,203][53807] Sum rewards: 4.191, reward structure: {'HEALTH': '-1.970', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.018', 'AMMO3': '0.054', 'AMMO4': '0.089', 'WEAPON5': '0.100', 'weapon4': '0.132', 'WEAPON4': '0.200', 'weapon5': '0.206', 'WEAPON3': '0.400', 'weapon2': '1.142', 'weapon3': '1.186', 'DAMAGECOUNT': '1.630', 'FRAGCOUNT': '2.000'} +[2023-09-14 12:33:05,629][53807] DAMAGECOUNT value on done: 69.0 +[2023-09-14 12:33:05,629][53807] DAMAGECOUNT value on done: 233.0 +[2023-09-14 12:33:05,630][53807] Sum rewards: 1.411, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'DAMAGECOUNT': '0.040', 'AMMO3': '0.052', 'weapon5': '0.190', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '1.168', 'weapon3': '1.364'} +[2023-09-14 12:33:06,008][53808] DAMAGECOUNT value on done: 278.0 +[2023-09-14 12:33:06,008][53808] DAMAGECOUNT value on done: 356.0 +[2023-09-14 12:33:06,009][53808] Sum rewards: 2.975, reward structure: {'HEALTH': '-1.280', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'weapon2': '0.004', 'AMMO2': '0.005', 'AMMO5': '0.009', 'AMMO4': '0.025', 'AMMO3': '0.040', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.238', 'WEAPON3': '0.400', 'weapon4': '0.634', 'DAMAGECOUNT': '0.900', 'weapon3': '2.602'} +[2023-09-14 12:33:06,185][53807] DAMAGECOUNT value on done: 710.0 +[2023-09-14 12:33:06,185][53807] DAMAGECOUNT value on done: 492.0 +[2023-09-14 12:33:06,186][53807] Sum rewards: 2.236, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.014', 'AMMO3': '0.039', 'AMMO4': '0.071', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon5': '0.132', 'WEAPON3': '0.300', 'weapon4': '0.316', 'DAMAGECOUNT': '0.550', 'weapon3': '1.022', 'weapon2': '1.738'} +[2023-09-14 12:33:06,496][53801] Updated weights for policy 0, policy_version 952 (0.0013) +[2023-09-14 12:33:06,543][53808] DAMAGECOUNT value on done: 357.0 +[2023-09-14 12:33:06,544][53808] DAMAGECOUNT value on done: 329.0 +[2023-09-14 12:33:06,544][53808] Sum rewards: 3.672, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.018', 'AMMO3': '0.051', 'AMMO4': '0.089', 'weapon4': '0.096', 'weapon5': '0.188', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon2': '1.024', 'DAMAGECOUNT': '1.220', 'weapon3': '1.378'} +[2023-09-14 12:33:06,545][53808] Sum rewards: 2.654, reward structure: {'HEALTH': '-1.120', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.012', 'AMMO2': '-0.002', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.030', 'WEAPON5': '0.100', 'weapon5': '0.188', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.450', 'FRAGCOUNT': '1.000', 'weapon2': '1.040', 'weapon3': '1.678'} +[2023-09-14 12:33:06,755][53805] DAMAGECOUNT value on done: 440.0 +[2023-09-14 12:33:06,755][53805] DAMAGECOUNT value on done: 288.0 +[2023-09-14 12:33:06,755][53805] Sum rewards: 3.667, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.039', 'AMMO2': '-0.008', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.040', 'weapon5': '0.100', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.630', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.200', 'weapon3': '2.286'} +[2023-09-14 12:33:06,756][53805] Sum rewards: 2.913, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.012', 'AMMO3': '0.041', 'AMMO4': '0.059', 'weapon5': '0.066', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.300', 'weapon4': '0.324', 'DAMAGECOUNT': '0.950', 'FRAGCOUNT': '1.000', 'weapon3': '1.012', 'weapon2': '1.094'} +[2023-09-14 12:33:06,985][53808] DAMAGECOUNT value on done: 325.0 +[2023-09-14 12:33:06,985][53808] DAMAGECOUNT value on done: 189.0 +[2023-09-14 12:33:06,986][53808] Sum rewards: 2.137, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO5': '0.005', 'AMMO4': '0.007', 'AMMO3': '0.036', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.118', 'weapon4': '0.226', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.900', 'weapon3': '1.258', 'weapon2': '1.286'} +[2023-09-14 12:33:07,430][53805] DAMAGECOUNT value on done: 425.0 +[2023-09-14 12:33:07,430][53805] DAMAGECOUNT value on done: 373.0 +[2023-09-14 12:33:07,431][53805] Sum rewards: 6.241, reward structure: {'HEALTH': '-1.750', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.030', 'AMMO3': '0.049', 'weapon5': '0.090', 'AMMO4': '0.151', 'weapon2': '0.154', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.596', 'FRAGCOUNT': '1.999', 'weapon3': '2.362', 'DAMAGECOUNT': '2.750'} +[2023-09-14 12:33:07,435][109198] Fps is (10 sec: 13926.4, 60 sec: 14062.9, 300 sec: 12784.5). Total num frames: 4861952. Throughput: 0: 1701.7, 1: 1801.2. Samples: 524864. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:33:07,436][109198] Avg episode reward: [(0, '3.105'), (1, '1.354')] +[2023-09-14 12:33:07,438][53585] Saving new best policy, reward=1.354! +[2023-09-14 12:33:07,496][53811] DAMAGECOUNT value on done: 506.0 +[2023-09-14 12:33:07,496][53811] DAMAGECOUNT value on done: 606.0 +[2023-09-14 12:33:07,497][53811] Sum rewards: 2.966, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.006', 'AMMO2': '0.007', 'AMMO4': '0.035', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'weapon2': '0.280', 'WEAPON3': '0.400', 'weapon5': '0.618', 'DAMAGECOUNT': '0.900', 'weapon3': '2.630'} +[2023-09-14 12:33:07,550][53808] DAMAGECOUNT value on done: 403.0 +[2023-09-14 12:33:07,550][53808] DAMAGECOUNT value on done: 456.0 +[2023-09-14 12:33:07,550][53808] Sum rewards: 3.789, reward structure: {'HEALTH': '-0.910', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.010', 'AMMO3': '0.020', 'AMMO4': '0.050', 'weapon5': '0.056', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.206', 'weapon2': '0.786', 'DAMAGECOUNT': '0.950', 'FRAGCOUNT': '1.000', 'weapon3': '1.218'} +[2023-09-14 12:33:07,890][53806] DAMAGECOUNT value on done: 374.0 +[2023-09-14 12:33:07,890][53806] DAMAGECOUNT value on done: 226.0 +[2023-09-14 12:33:07,891][53806] Sum rewards: 4.537, reward structure: {'HEALTH': '-0.640', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.016', 'AMMO3': '0.028', 'AMMO4': '0.081', 'weapon5': '0.098', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.436', 'weapon3': '0.758', 'DAMAGECOUNT': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.554'} +[2023-09-14 12:33:08,033][53811] DAMAGECOUNT value on done: 430.0 +[2023-09-14 12:33:08,034][53811] Sum rewards: 4.494, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.008', 'AMMO3': '0.040', 'AMMO4': '0.040', 'weapon5': '0.098', 'WEAPON4': '0.100', 'weapon4': '0.124', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.628', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.250', 'weapon3': '2.698'} +[2023-09-14 12:33:08,035][53811] DAMAGECOUNT value on done: 470.0 +[2023-09-14 12:33:08,035][53811] Sum rewards: 3.622, reward structure: {'HEALTH': '-1.250', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'weapon5': '0.002', 'AMMO5': '0.005', 'AMMO2': '0.028', 'AMMO3': '0.055', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO4': '0.137', 'weapon4': '0.144', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon3': '1.068', 'DAMAGECOUNT': '1.100', 'weapon2': '1.732'} +[2023-09-14 12:33:08,508][53806] DAMAGECOUNT value on done: 345.0 +[2023-09-14 12:33:08,509][53806] Sum rewards: 3.803, reward structure: {'HEALTH': '-1.250', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.024', 'AMMO3': '0.043', 'weapon5': '0.084', 'WEAPON5': '0.100', 'AMMO4': '0.119', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon4': '0.364', 'weapon3': '0.926', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.250', 'weapon2': '1.638'} +[2023-09-14 12:33:08,509][53806] DAMAGECOUNT value on done: 220.0 +[2023-09-14 12:33:08,509][53806] Sum rewards: 1.987, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO3': '0.055', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon4': '0.300', 'weapon5': '0.354', 'WEAPON3': '0.400', 'FRAGCOUNT': '0.999', 'weapon2': '1.090', 'weapon3': '1.240', 'DAMAGECOUNT': '1.250'} +[2023-09-14 12:33:09,209][53806] DAMAGECOUNT value on done: 373.0 +[2023-09-14 12:33:09,209][53806] DAMAGECOUNT value on done: 297.0 +[2023-09-14 12:33:09,210][53806] Sum rewards: 4.348, reward structure: {'HEALTH': '-0.430', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.019', 'AMMO4': '0.025', 'weapon5': '0.048', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.218', 'weapon2': '0.364', 'FRAGCOUNT': '1.000', 'weapon3': '1.276', 'DAMAGECOUNT': '1.420'} +[2023-09-14 12:33:09,780][53806] DAMAGECOUNT value on done: 255.0 +[2023-09-14 12:33:09,780][53806] DAMAGECOUNT value on done: 285.0 +[2023-09-14 12:33:09,781][53806] Sum rewards: 2.005, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.012', 'AMMO3': '0.022', 'AMMO4': '0.059', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.120', 'WEAPON3': '0.200', 'weapon5': '0.294', 'DAMAGECOUNT': '0.450', 'weapon3': '1.056', 'weapon2': '1.588'} +[2023-09-14 12:33:10,573][53802] Updated weights for policy 1, policy_version 240 (0.0014) +[2023-09-14 12:33:12,007][53809] DAMAGECOUNT value on done: 468.0 +[2023-09-14 12:33:12,007][53809] Sum rewards: 0.857, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.004', 'AMMO3': '0.051', 'weapon5': '0.082', 'WEAPON5': '0.100', 'WEAPON3': '0.400', 'weapon2': '0.934', 'weapon3': '1.346'} +[2023-09-14 12:33:12,007][53809] DAMAGECOUNT value on done: 200.0 +[2023-09-14 12:33:12,435][109198] Fps is (10 sec: 14336.1, 60 sec: 14062.9, 300 sec: 12818.1). Total num frames: 4931584. Throughput: 0: 1695.9, 1: 1791.8. Samples: 535279. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:33:12,437][109198] Avg episode reward: [(0, '3.080'), (1, '1.502')] +[2023-09-14 12:33:12,444][53585] Saving new best policy, reward=1.502! +[2023-09-14 12:33:12,583][53801] Updated weights for policy 0, policy_version 962 (0.0013) +[2023-09-14 12:33:12,591][53809] DAMAGECOUNT value on done: 52.0 +[2023-09-14 12:33:12,591][53809] DAMAGECOUNT value on done: 143.0 +[2023-09-14 12:33:13,164][53809] DAMAGECOUNT value on done: 335.0 +[2023-09-14 12:33:13,164][53809] DAMAGECOUNT value on done: 341.0 +[2023-09-14 12:33:13,164][53809] Sum rewards: 3.323, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.007', 'AMMO5': '0.007', 'AMMO4': '0.033', 'AMMO3': '0.039', 'weapon4': '0.086', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.298', 'WEAPON3': '0.300', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.046', 'weapon2': '1.206'} +[2023-09-14 12:33:13,165][53809] Sum rewards: 3.029, reward structure: {'HEALTH': '-1.570', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.007', 'weapon2': '0.020', 'AMMO4': '0.025', 'AMMO3': '0.042', 'WEAPON4': '0.100', 'weapon5': '0.154', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.468', 'DAMAGECOUNT': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '2.528'} +[2023-09-14 12:33:13,712][53809] DAMAGECOUNT value on done: 125.0 +[2023-09-14 12:33:13,712][53809] DAMAGECOUNT value on done: 195.0 +[2023-09-14 12:33:13,713][53809] Sum rewards: 4.349, reward structure: {'HEALTH': '-0.350', 'AMMO4': '-0.000', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.136', 'WEAPON3': '0.200', 'weapon5': '0.252', 'weapon2': '0.284', 'FRAGCOUNT': '1.000', 'weapon3': '1.204', 'DAMAGECOUNT': '1.400'} +[2023-09-14 12:33:14,029][53810] DAMAGECOUNT value on done: 350.0 +[2023-09-14 12:33:14,029][53810] DAMAGECOUNT value on done: 262.0 +[2023-09-14 12:33:14,030][53810] Sum rewards: 5.000, reward structure: {'HEALTH': '-0.570', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.020', 'AMMO3': '0.020', 'AMMO4': '0.099', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon5': '0.186', 'WEAPON3': '0.200', 'weapon4': '0.248', 'weapon3': '0.936', 'FRAGCOUNT': '1.000', 'weapon2': '1.208', 'DAMAGECOUNT': '1.450'} +[2023-09-14 12:33:14,584][53810] DAMAGECOUNT value on done: 385.0 +[2023-09-14 12:33:14,584][53810] DAMAGECOUNT value on done: 550.0 +[2023-09-14 12:33:14,585][53810] Sum rewards: 4.005, reward structure: {'HEALTH': '-1.650', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.016', 'AMMO3': '0.040', 'weapon2': '0.044', 'weapon5': '0.080', 'AMMO4': '0.082', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.450', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.350', 'weapon3': '2.784'} +[2023-09-14 12:33:15,074][53810] DAMAGECOUNT value on done: 294.0 +[2023-09-14 12:33:15,074][53810] DAMAGECOUNT value on done: 117.0 +[2023-09-14 12:33:15,651][53810] DAMAGECOUNT value on done: 128.0 +[2023-09-14 12:33:15,651][53810] DAMAGECOUNT value on done: 283.0 +[2023-09-14 12:33:15,652][53810] Sum rewards: 1.424, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO2': '0.004', 'AMMO5': '0.010', 'AMMO4': '0.022', 'AMMO3': '0.043', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.256', 'weapon4': '0.286', 'WEAPON3': '0.300', 'weapon3': '0.948', 'weapon2': '1.156'} +[2023-09-14 12:33:16,052][53802] Updated weights for policy 1, policy_version 250 (0.0011) +[2023-09-14 12:33:16,748][53804] DAMAGECOUNT value on done: 180.0 +[2023-09-14 12:33:16,748][53804] DAMAGECOUNT value on done: 200.0 +[2023-09-14 12:33:16,749][53804] Sum rewards: 2.188, reward structure: {'HEALTH': '-1.550', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.007', 'AMMO5': '0.008', 'AMMO4': '0.034', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'weapon5': '0.140', 'weapon4': '0.190', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.400', 'DAMAGECOUNT': '0.600', 'weapon3': '2.620'} +[2023-09-14 12:33:17,302][53804] DAMAGECOUNT value on done: 335.0 +[2023-09-14 12:33:17,302][53804] Sum rewards: 6.403, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.010', 'AMMO4': '0.025', 'AMMO3': '0.049', 'WEAPON4': '0.100', 'weapon2': '0.140', 'WEAPON5': '0.200', 'weapon4': '0.336', 'WEAPON3': '0.400', 'weapon5': '0.552', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.100', 'weapon3': '2.488'} +[2023-09-14 12:33:17,302][53804] DAMAGECOUNT value on done: 344.0 +[2023-09-14 12:33:17,435][109198] Fps is (10 sec: 14336.1, 60 sec: 14063.0, 300 sec: 12873.2). Total num frames: 5005312. Throughput: 0: 1686.5, 1: 1779.1. Samples: 556161. Policy #0 lag: (min: 0.0, avg: 0.4, max: 2.0) +[2023-09-14 12:33:17,436][109198] Avg episode reward: [(0, '3.105'), (1, '1.683')] +[2023-09-14 12:33:17,438][53585] Saving new best policy, reward=1.683! +[2023-09-14 12:33:17,893][53804] DAMAGECOUNT value on done: 717.0 +[2023-09-14 12:33:17,893][53804] DAMAGECOUNT value on done: 692.0 +[2023-09-14 12:33:17,894][53804] Sum rewards: 3.431, reward structure: {'HEALTH': '-1.400', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.009', 'AMMO4': '0.022', 'AMMO3': '0.043', 'weapon2': '0.080', 'WEAPON4': '0.100', 'weapon5': '0.130', 'WEAPON5': '0.200', 'weapon4': '0.338', 'WEAPON3': '0.400', 'DAMAGECOUNT': '1.500', 'weapon3': '3.006'} +[2023-09-14 12:33:17,894][53804] Sum rewards: 2.872, reward structure: {'HEALTH': '-1.650', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.009', 'AMMO3': '0.039', 'AMMO4': '0.044', 'WEAPON4': '0.100', 'weapon2': '0.172', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.458', 'weapon4': '0.464', 'DAMAGECOUNT': '1.100', 'weapon3': '2.528'} +[2023-09-14 12:33:18,465][53801] Updated weights for policy 0, policy_version 972 (0.0013) +[2023-09-14 12:33:18,487][53804] DAMAGECOUNT value on done: 570.0 +[2023-09-14 12:33:18,488][53804] DAMAGECOUNT value on done: 240.0 +[2023-09-14 12:33:21,879][53802] Updated weights for policy 1, policy_version 260 (0.0013) +[2023-09-14 12:33:22,435][109198] Fps is (10 sec: 13926.3, 60 sec: 13994.7, 300 sec: 12879.7). Total num frames: 5070848. Throughput: 0: 1683.8, 1: 1774.6. Samples: 577527. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:33:22,436][109198] Avg episode reward: [(0, '3.061'), (1, '1.706')] +[2023-09-14 12:33:22,443][53585] Saving new best policy, reward=1.706! +[2023-09-14 12:33:23,678][53811] Large shaping reward 2.521 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 2.0), ('DAMAGECOUNT', 1.52, 152.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 12:33:24,655][53801] Updated weights for policy 0, policy_version 982 (0.0012) +[2023-09-14 12:33:27,435][109198] Fps is (10 sec: 13516.8, 60 sec: 13926.4, 300 sec: 12908.0). Total num frames: 5140480. Throughput: 0: 1684.7, 1: 1775.3. Samples: 587205. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:33:27,436][109198] Avg episode reward: [(0, '3.061'), (1, '1.706')] +[2023-09-14 12:33:27,835][53802] Updated weights for policy 1, policy_version 270 (0.0015) +[2023-09-14 12:33:30,805][53801] Updated weights for policy 0, policy_version 992 (0.0013) +[2023-09-14 12:33:32,435][109198] Fps is (10 sec: 13926.5, 60 sec: 13789.9, 300 sec: 12934.8). Total num frames: 5210112. Throughput: 0: 1696.2, 1: 1788.5. Samples: 607941. Policy #0 lag: (min: 0.0, avg: 0.5, max: 1.0) +[2023-09-14 12:33:32,436][109198] Avg episode reward: [(0, '3.061'), (1, '1.706')] +[2023-09-14 12:33:33,463][53802] Updated weights for policy 1, policy_version 280 (0.0013) +[2023-09-14 12:33:33,481][53804] Large shaping reward 2.601 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 1.0), ('DAMAGECOUNT', 1.6, 160.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 12:33:36,681][53801] Updated weights for policy 0, policy_version 1002 (0.0013) +[2023-09-14 12:33:37,435][109198] Fps is (10 sec: 13926.3, 60 sec: 13789.9, 300 sec: 12960.2). Total num frames: 5279744. Throughput: 0: 1700.2, 1: 1789.9. Samples: 629267. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:33:37,436][109198] Avg episode reward: [(0, '3.061'), (1, '1.706')] +[2023-09-14 12:33:38,748][53805] DAMAGECOUNT value on done: 413.0 +[2023-09-14 12:33:38,749][53805] Sum rewards: 5.903, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.023', 'AMMO3': '0.028', 'AMMO4': '0.117', 'weapon5': '0.142', 'WEAPON3': '0.200', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.208', 'weapon3': '0.638', 'FRAGCOUNT': '1.000', 'weapon2': '1.838', 'DAMAGECOUNT': '3.300'} +[2023-09-14 12:33:38,748][53805] DAMAGECOUNT value on done: 454.0 +[2023-09-14 12:33:38,774][53811] DAMAGECOUNT value on done: 737.0 +[2023-09-14 12:33:38,774][53811] DAMAGECOUNT value on done: 393.0 +[2023-09-14 12:33:38,775][53811] Sum rewards: 4.737, reward structure: {'HEALTH': '-0.350', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.412', 'weapon5': '0.662', 'FRAGCOUNT': '1.000', 'weapon3': '1.200', 'DAMAGECOUNT': '1.520'} +[2023-09-14 12:33:39,226][53802] Updated weights for policy 1, policy_version 290 (0.0014) +[2023-09-14 12:33:39,329][53811] DAMAGECOUNT value on done: 353.0 +[2023-09-14 12:33:39,329][53811] DAMAGECOUNT value on done: 386.0 +[2023-09-14 12:33:39,331][53805] DAMAGECOUNT value on done: 407.0 +[2023-09-14 12:33:39,332][53805] DAMAGECOUNT value on done: 605.0 +[2023-09-14 12:33:42,218][53807] DAMAGECOUNT value on done: 170.0 +[2023-09-14 12:33:42,219][53807] Sum rewards: 2.805, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.012', 'AMMO3': '0.034', 'AMMO4': '0.058', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.284', 'WEAPON3': '0.300', 'weapon4': '0.344', 'DAMAGECOUNT': '0.900', 'weapon3': '1.214', 'weapon2': '1.452'} +[2023-09-14 12:33:42,218][53807] DAMAGECOUNT value on done: 178.0 +[2023-09-14 12:33:42,435][109198] Fps is (10 sec: 13926.4, 60 sec: 13858.2, 300 sec: 12984.3). Total num frames: 5349376. Throughput: 0: 1699.6, 1: 1789.6. Samples: 639741. Policy #0 lag: (min: 0.0, avg: 0.8, max: 1.0) +[2023-09-14 12:33:42,437][109198] Avg episode reward: [(0, '3.001'), (1, '1.791')] +[2023-09-14 12:33:42,443][53585] Saving new best policy, reward=1.791! +[2023-09-14 12:33:42,840][53807] DAMAGECOUNT value on done: 509.0 +[2023-09-14 12:33:42,840][53807] DAMAGECOUNT value on done: 387.0 +[2023-09-14 12:33:42,841][53807] Sum rewards: 1.717, reward structure: {'HEALTH': '-2.050', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.002', 'HITCOUNT': '0.000', 'AMMO2': '0.006', 'AMMO5': '0.010', 'AMMO4': '0.028', 'AMMO3': '0.074', 'WEAPON5': '0.300', 'weapon2': '0.352', 'WEAPON3': '0.600', 'weapon5': '0.632', 'DAMAGECOUNT': '0.800', 'weapon3': '2.966'} +[2023-09-14 12:33:42,888][53801] Updated weights for policy 0, policy_version 1012 (0.0014) +[2023-09-14 12:33:43,345][53807] DAMAGECOUNT value on done: 75.0 +[2023-09-14 12:33:43,345][53807] DAMAGECOUNT value on done: 273.0 +[2023-09-14 12:33:43,882][53808] DAMAGECOUNT value on done: 478.0 +[2023-09-14 12:33:43,882][53808] DAMAGECOUNT value on done: 776.0 +[2023-09-14 12:33:43,883][53808] Sum rewards: 1.413, reward structure: {'DEATHCOUNT': '-4.000', 'HEALTH': '-4.000', 'HITCOUNT': '0.000', 'weapon5': '0.002', 'AMMO5': '0.020', 'AMMO2': '0.069', 'AMMO3': '0.114', 'weapon2': '0.232', 'weapon4': '0.280', 'AMMO4': '0.347', 'WEAPON5': '0.400', 'WEAPON4': '0.400', 'WEAPON3': '0.800', 'DAMAGECOUNT': '2.000', 'FRAGCOUNT': '2.000', 'weapon3': '2.748'} +[2023-09-14 12:33:43,883][53808] Sum rewards: 8.323, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.007', 'AMMO5': '0.007', 'AMMO4': '0.032', 'weapon5': '0.044', 'AMMO3': '0.059', 'weapon2': '0.080', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.500', 'weapon4': '0.578', 'weapon3': '2.416', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.200'} +[2023-09-14 12:33:43,917][53807] DAMAGECOUNT value on done: 1020.0 +[2023-09-14 12:33:43,917][53807] Sum rewards: 6.723, reward structure: {'HEALTH': '-2.300', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.012', 'AMMO2': '0.017', 'weapon2': '0.018', 'AMMO3': '0.072', 'AMMO4': '0.085', 'weapon5': '0.126', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon4': '0.540', 'WEAPON3': '0.600', 'weapon3': '2.852', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.100'} +[2023-09-14 12:33:43,918][53807] DAMAGECOUNT value on done: 722.0 +[2023-09-14 12:33:43,919][53807] Sum rewards: 2.973, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'weapon5': '0.016', 'AMMO2': '0.028', 'AMMO3': '0.097', 'WEAPON5': '0.100', 'AMMO4': '0.137', 'WEAPON4': '0.300', 'weapon4': '0.386', 'WEAPON3': '0.600', 'weapon3': '1.094', 'weapon2': '1.910', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.300'} +[2023-09-14 12:33:44,520][53808] DAMAGECOUNT value on done: 422.0 +[2023-09-14 12:33:44,520][53808] DAMAGECOUNT value on done: 459.0 +[2023-09-14 12:33:44,521][53808] Sum rewards: 3.795, reward structure: {'HEALTH': '-0.650', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'weapon5': '0.078', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.368', 'FRAGCOUNT': '1.000', 'weapon3': '1.246', 'DAMAGECOUNT': '1.300'} +[2023-09-14 12:33:44,764][53805] DAMAGECOUNT value on done: 308.0 +[2023-09-14 12:33:44,766][53805] DAMAGECOUNT value on done: 713.0 +[2023-09-14 12:33:44,767][53805] Sum rewards: 6.776, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.005', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'weapon5': '0.392', 'WEAPON3': '0.400', 'weapon2': '0.788', 'FRAGCOUNT': '1.999', 'weapon3': '2.418', 'DAMAGECOUNT': '2.730'} +[2023-09-14 12:33:44,962][53808] DAMAGECOUNT value on done: 375.0 +[2023-09-14 12:33:44,962][53808] DAMAGECOUNT value on done: 202.0 +[2023-09-14 12:33:44,963][53808] Sum rewards: 1.767, reward structure: {'HEALTH': '-1.400', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.015', 'AMMO3': '0.067', 'AMMO4': '0.076', 'DAMAGECOUNT': '0.130', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.338', 'WEAPON3': '0.400', 'weapon5': '0.404', 'weapon3': '0.738', 'weapon2': '1.590'} +[2023-09-14 12:33:45,041][53802] Updated weights for policy 1, policy_version 300 (0.0013) +[2023-09-14 12:33:45,328][53805] DAMAGECOUNT value on done: 578.0 +[2023-09-14 12:33:45,329][53805] Sum rewards: 4.128, reward structure: {'HEALTH': '-2.950', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.010', 'AMMO5': '0.013', 'AMMO4': '0.050', 'AMMO3': '0.071', 'weapon2': '0.108', 'weapon5': '0.158', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon4': '0.616', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.050', 'weapon3': '2.902'} +[2023-09-14 12:33:45,328][53805] DAMAGECOUNT value on done: 670.0 +[2023-09-14 12:33:45,330][53805] Sum rewards: 4.009, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.028', 'AMMO3': '0.042', 'weapon2': '0.076', 'AMMO4': '0.139', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'WEAPON3': '0.400', 'weapon5': '0.426', 'weapon4': '0.606', 'FRAGCOUNT': '1.000', 'weapon3': '2.332', 'DAMAGECOUNT': '2.450'} +[2023-09-14 12:33:45,529][53808] DAMAGECOUNT value on done: 666.0 +[2023-09-14 12:33:45,529][53808] DAMAGECOUNT value on done: 448.0 +[2023-09-14 12:33:45,530][53808] Sum rewards: 5.935, reward structure: {'HEALTH': '-0.450', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.108', 'WEAPON3': '0.200', 'weapon5': '0.290', 'weapon2': '0.382', 'weapon3': '1.082', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.100'} +[2023-09-14 12:33:45,682][53811] DAMAGECOUNT value on done: 528.0 +[2023-09-14 12:33:45,682][53811] DAMAGECOUNT value on done: 710.0 +[2023-09-14 12:33:45,683][53811] Sum rewards: 4.415, reward structure: {'HEALTH': '-0.220', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.442', 'weapon5': '0.510', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.040', 'weapon3': '1.350'} +[2023-09-14 12:33:46,279][53811] DAMAGECOUNT value on done: 490.0 +[2023-09-14 12:33:46,279][53811] DAMAGECOUNT value on done: 490.0 +[2023-09-14 12:33:46,280][53811] Sum rewards: 2.386, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.035', 'AMMO2': '-0.007', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.006', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'weapon5': '0.388', 'WEAPON3': '0.400', 'weapon2': '0.582', 'DAMAGECOUNT': '0.600', 'weapon3': '2.212'} +[2023-09-14 12:33:46,540][53806] DAMAGECOUNT value on done: 488.0 +[2023-09-14 12:33:46,540][53806] DAMAGECOUNT value on done: 276.0 +[2023-09-14 12:33:46,540][53806] Sum rewards: 3.943, reward structure: {'HEALTH': '-0.500', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'weapon5': '0.048', 'weapon4': '0.090', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.418', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.140', 'weapon3': '1.324'} +[2023-09-14 12:33:47,115][53806] DAMAGECOUNT value on done: 245.0 +[2023-09-14 12:33:47,116][53806] DAMAGECOUNT value on done: 482.0 +[2023-09-14 12:33:47,435][109198] Fps is (10 sec: 13926.4, 60 sec: 13926.4, 300 sec: 13007.3). Total num frames: 5419008. Throughput: 0: 1695.4, 1: 1789.2. Samples: 659853. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:33:47,436][109198] Avg episode reward: [(0, '3.252'), (1, '2.018')] +[2023-09-14 12:33:47,438][53511] Saving new best policy, reward=3.252! +[2023-09-14 12:33:47,438][53585] Saving new best policy, reward=2.018! +[2023-09-14 12:33:47,963][53806] DAMAGECOUNT value on done: 489.0 +[2023-09-14 12:33:47,964][53806] DAMAGECOUNT value on done: 452.0 +[2023-09-14 12:33:47,964][53806] Sum rewards: 4.439, reward structure: {'HEALTH': '-1.390', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.010', 'weapon2': '0.016', 'AMMO3': '0.040', 'AMMO4': '0.049', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon5': '0.306', 'WEAPON3': '0.400', 'weapon4': '0.654', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.550', 'weapon3': '2.398'} +[2023-09-14 12:33:48,582][53806] DAMAGECOUNT value on done: 290.0 +[2023-09-14 12:33:48,582][53806] DAMAGECOUNT value on done: 494.0 +[2023-09-14 12:33:48,583][53806] Sum rewards: 2.248, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.067', 'weapon4': '0.096', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.296', 'WEAPON3': '0.500', 'weapon2': '1.114', 'weapon3': '1.806', 'DAMAGECOUNT': '2.090'} +[2023-09-14 12:33:49,054][53801] Updated weights for policy 0, policy_version 1022 (0.0014) +[2023-09-14 12:33:50,782][53802] Updated weights for policy 1, policy_version 310 (0.0012) +[2023-09-14 12:33:52,197][53809] DAMAGECOUNT value on done: 568.0 +[2023-09-14 12:33:52,198][53809] DAMAGECOUNT value on done: 365.0 +[2023-09-14 12:33:52,198][53809] Sum rewards: 1.658, reward structure: {'HEALTH': '-2.350', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.073', 'WEAPON4': '0.100', 'weapon4': '0.168', 'WEAPON5': '0.200', 'weapon5': '0.422', 'WEAPON3': '0.500', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon3': '1.136', 'weapon2': '1.410'} +[2023-09-14 12:33:52,198][53809] Sum rewards: 2.364, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.005', 'AMMO4': '0.026', 'AMMO3': '0.036', 'WEAPON5': '0.100', 'weapon5': '0.124', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon4': '0.392', 'FRAGCOUNT': '0.999', 'weapon3': '1.130', 'weapon2': '1.398', 'DAMAGECOUNT': '1.650'} +[2023-09-14 12:33:52,435][109198] Fps is (10 sec: 13516.7, 60 sec: 13858.1, 300 sec: 13009.7). Total num frames: 5484544. Throughput: 0: 1682.5, 1: 1774.1. Samples: 680413. Policy #0 lag: (min: 0.0, avg: 0.7, max: 1.0) +[2023-09-14 12:33:52,436][109198] Avg episode reward: [(0, '3.276'), (1, '2.054')] +[2023-09-14 12:33:52,442][53511] Saving new best policy, reward=3.276! +[2023-09-14 12:33:52,443][53585] Saving new best policy, reward=2.054! +[2023-09-14 12:33:53,029][53809] DAMAGECOUNT value on done: 147.0 +[2023-09-14 12:33:53,030][53809] DAMAGECOUNT value on done: 246.0 +[2023-09-14 12:33:53,030][53809] Sum rewards: 3.193, reward structure: {'HEALTH': '-0.950', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'weapon5': '0.158', 'WEAPON3': '0.200', 'weapon2': '0.350', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.030', 'weapon3': '1.312'} +[2023-09-14 12:33:53,516][53809] DAMAGECOUNT value on done: 400.0 +[2023-09-14 12:33:53,516][53809] DAMAGECOUNT value on done: 351.0 +[2023-09-14 12:33:54,077][53809] DAMAGECOUNT value on done: 320.0 +[2023-09-14 12:33:54,078][53809] Sum rewards: 4.351, reward structure: {'HEALTH': '-1.650', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.022', 'AMMO3': '0.052', 'WEAPON5': '0.100', 'AMMO4': '0.108', 'WEAPON4': '0.200', 'weapon4': '0.258', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon3': '1.104', 'weapon2': '1.802', 'DAMAGECOUNT': '1.950'} +[2023-09-14 12:33:54,078][53809] DAMAGECOUNT value on done: 365.0 +[2023-09-14 12:33:54,079][53809] Sum rewards: 2.948, reward structure: {'HEALTH': '-2.350', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.056', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.282', 'weapon4': '0.348', 'weapon2': '0.406', 'WEAPON3': '0.500', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.700', 'weapon3': '2.698'} +[2023-09-14 12:33:54,802][53810] DAMAGECOUNT value on done: 316.0 +[2023-09-14 12:33:54,802][53810] DAMAGECOUNT value on done: 350.0 +[2023-09-14 12:33:54,803][53810] Sum rewards: 1.553, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'AMMO4': '-0.016', 'AMMO2': '-0.003', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.039', 'WEAPON5': '0.100', 'weapon5': '0.196', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.540', 'weapon3': '1.140', 'weapon2': '1.254'} +[2023-09-14 12:33:54,803][53810] Sum rewards: 1.561, reward structure: {'HEALTH': '-1.440', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.009', 'AMMO2': '0.019', 'AMMO3': '0.054', 'AMMO4': '0.095', 'WEAPON4': '0.100', 'weapon4': '0.108', 'WEAPON5': '0.200', 'weapon5': '0.282', 'WEAPON3': '0.400', 'weapon3': '1.138', 'weapon2': '1.596'} +[2023-09-14 12:33:55,504][53810] DAMAGECOUNT value on done: 455.0 +[2023-09-14 12:33:55,505][53810] DAMAGECOUNT value on done: 624.0 +[2023-09-14 12:33:55,814][53801] Updated weights for policy 0, policy_version 1032 (0.0014) +[2023-09-14 12:33:55,929][53810] DAMAGECOUNT value on done: 364.0 +[2023-09-14 12:33:55,929][53810] DAMAGECOUNT value on done: 142.0 +[2023-09-14 12:33:55,929][53810] Sum rewards: 4.525, reward structure: {'HEALTH': '-0.700', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.033', 'weapon5': '0.076', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.163', 'WEAPON3': '0.200', 'DAMAGECOUNT': '0.250', 'weapon4': '0.472', 'weapon3': '0.832', 'FRAGCOUNT': '1.000', 'weapon2': '1.974'} +[2023-09-14 12:33:56,646][53810] DAMAGECOUNT value on done: 148.0 +[2023-09-14 12:33:56,647][53810] DAMAGECOUNT value on done: 313.0 +[2023-09-14 12:33:56,648][53810] Sum rewards: 1.973, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.001', 'AMMO4': '0.004', 'AMMO5': '0.010', 'AMMO3': '0.039', 'WEAPON4': '0.100', 'weapon4': '0.138', 'WEAPON5': '0.200', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.300', 'weapon5': '0.590', 'weapon3': '1.072', 'weapon2': '1.320'} +[2023-09-14 12:33:57,435][109198] Fps is (10 sec: 12287.9, 60 sec: 13653.3, 300 sec: 12973.8). Total num frames: 5541888. Throughput: 0: 1665.8, 1: 1759.2. Samples: 689403. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:33:57,437][109198] Avg episode reward: [(0, '3.255'), (1, '2.210')] +[2023-09-14 12:33:57,467][53585] Saving new best policy, reward=2.210! +[2023-09-14 12:33:57,476][53802] Updated weights for policy 1, policy_version 320 (0.0013) +[2023-09-14 12:33:58,251][53804] DAMAGECOUNT value on done: 421.0 +[2023-09-14 12:33:58,252][53804] Sum rewards: 6.325, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.025', 'AMMO3': '0.059', 'AMMO4': '0.127', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon5': '0.208', 'WEAPON3': '0.400', 'weapon4': '0.554', 'weapon3': '0.836', 'weapon2': '1.396', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.410'} +[2023-09-14 12:33:58,252][53804] DAMAGECOUNT value on done: 315.0 +[2023-09-14 12:33:58,253][53804] Sum rewards: 1.062, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.013', 'AMMO4': '0.023', 'weapon2': '0.082', 'AMMO3': '0.091', 'weapon5': '0.180', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.398', 'WEAPON3': '0.700', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.150', 'weapon3': '2.920'} +[2023-09-14 12:33:59,025][53804] DAMAGECOUNT value on done: 523.0 +[2023-09-14 12:33:59,025][53804] Sum rewards: 4.536, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.027', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'weapon2': '0.388', 'WEAPON3': '0.400', 'weapon5': '0.432', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.880', 'weapon3': '2.220'} +[2023-09-14 12:33:59,025][53804] DAMAGECOUNT value on done: 404.0 +[2023-09-14 12:33:59,026][53804] Sum rewards: 2.122, reward structure: {'HEALTH': '-1.880', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.012', 'AMMO3': '0.038', 'AMMO4': '0.060', 'WEAPON4': '0.100', 'weapon4': '0.256', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.600', 'weapon3': '0.886', 'FRAGCOUNT': '1.000', 'weapon2': '1.750'} +[2023-09-14 12:33:59,705][53804] DAMAGECOUNT value on done: 932.0 +[2023-09-14 12:33:59,706][53804] Sum rewards: 4.806, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.021', 'AMMO3': '0.055', 'AMMO4': '0.106', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon5': '0.276', 'weapon2': '0.384', 'WEAPON3': '0.500', 'weapon4': '0.526', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.150', 'weapon3': '2.380'} +[2023-09-14 12:33:59,705][53804] DAMAGECOUNT value on done: 906.0 +[2023-09-14 12:33:59,706][53804] Sum rewards: 4.265, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.056', 'WEAPON4': '0.100', 'weapon5': '0.120', 'WEAPON5': '0.200', 'weapon4': '0.220', 'weapon2': '0.404', 'WEAPON3': '0.500', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.140', 'weapon3': '2.550'} +[2023-09-14 12:34:00,299][53804] DAMAGECOUNT value on done: 340.0 +[2023-09-14 12:34:00,300][53804] DAMAGECOUNT value on done: 914.0 +[2023-09-14 12:34:00,300][53804] Sum rewards: 3.336, reward structure: {'HEALTH': '-1.940', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.022', 'AMMO3': '0.053', 'AMMO4': '0.110', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.428', 'weapon5': '0.642', 'weapon2': '0.928', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.282'} +[2023-09-14 12:34:00,301][53804] Sum rewards: 5.733, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.034', 'AMMO2': '-0.007', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'weapon5': '0.224', 'WEAPON3': '0.400', 'weapon2': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.962', 'DAMAGECOUNT': '3.440'} +[2023-09-14 12:34:02,435][109198] Fps is (10 sec: 11468.9, 60 sec: 13516.8, 300 sec: 12939.7). Total num frames: 5599232. Throughput: 0: 1630.8, 1: 1726.2. Samples: 707224. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:34:02,436][109198] Avg episode reward: [(0, '3.321'), (1, '2.286')] +[2023-09-14 12:34:02,449][53511] Saving new best policy, reward=3.321! +[2023-09-14 12:34:02,450][53585] Saving new best policy, reward=2.286! +[2023-09-14 12:34:03,323][53801] Updated weights for policy 0, policy_version 1042 (0.0015) +[2023-09-14 12:34:04,274][53802] Updated weights for policy 1, policy_version 330 (0.0013) +[2023-09-14 12:34:07,436][109198] Fps is (10 sec: 11468.2, 60 sec: 13243.6, 300 sec: 12906.9). Total num frames: 5656576. Throughput: 0: 1576.4, 1: 1670.8. Samples: 723655. Policy #0 lag: (min: 0.0, avg: 0.7, max: 3.0) +[2023-09-14 12:34:07,438][109198] Avg episode reward: [(0, '3.321'), (1, '2.286')] +[2023-09-14 12:34:10,761][53801] Updated weights for policy 0, policy_version 1052 (0.0018) +[2023-09-14 12:34:11,708][53802] Updated weights for policy 1, policy_version 340 (0.0012) +[2023-09-14 12:34:12,439][109198] Fps is (10 sec: 11464.3, 60 sec: 13038.1, 300 sec: 12875.5). Total num frames: 5713920. Throughput: 0: 1562.8, 1: 1654.6. Samples: 732000. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:34:12,442][109198] Avg episode reward: [(0, '3.321'), (1, '2.286')] +[2023-09-14 12:34:12,447][53511] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001054_4317184.pth... +[2023-09-14 12:34:12,448][53585] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000341_1396736.pth... +[2023-09-14 12:34:12,507][53511] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000672_2752512.pth +[2023-09-14 12:34:17,435][109198] Fps is (10 sec: 11059.9, 60 sec: 12697.6, 300 sec: 12828.3). Total num frames: 5767168. Throughput: 0: 1517.8, 1: 1608.6. Samples: 748630. Policy #0 lag: (min: 0.0, avg: 0.7, max: 1.0) +[2023-09-14 12:34:17,436][109198] Avg episode reward: [(0, '3.321'), (1, '2.286')] +[2023-09-14 12:34:18,260][53801] Updated weights for policy 0, policy_version 1062 (0.0016) +[2023-09-14 12:34:18,738][53802] Updated weights for policy 1, policy_version 350 (0.0012) +[2023-09-14 12:34:22,435][109198] Fps is (10 sec: 11063.6, 60 sec: 12561.1, 300 sec: 12800.0). Total num frames: 5824512. Throughput: 0: 1466.7, 1: 1555.7. Samples: 765274. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:34:22,436][109198] Avg episode reward: [(0, '3.321'), (1, '2.286')] +[2023-09-14 12:34:23,032][53811] DAMAGECOUNT value on done: 762.0 +[2023-09-14 12:34:23,032][53811] DAMAGECOUNT value on done: 408.0 +[2023-09-14 12:34:23,355][53805] DAMAGECOUNT value on done: 613.0 +[2023-09-14 12:34:23,356][53805] Sum rewards: 3.902, reward structure: {'HEALTH': '-1.350', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.019', 'AMMO3': '0.039', 'weapon5': '0.088', 'AMMO4': '0.093', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon4': '0.432', 'weapon3': '0.922', 'FRAGCOUNT': '1.000', 'weapon2': '1.056', 'DAMAGECOUNT': '2.000'} +[2023-09-14 12:34:23,355][53805] DAMAGECOUNT value on done: 589.0 +[2023-09-14 12:34:23,357][53805] Sum rewards: 3.720, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.040', 'weapon5': '0.156', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.742', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.350', 'weapon3': '1.884'} +[2023-09-14 12:34:23,700][53811] DAMAGECOUNT value on done: 373.0 +[2023-09-14 12:34:23,701][53811] DAMAGECOUNT value on done: 411.0 +[2023-09-14 12:34:23,701][53811] Sum rewards: 2.642, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.007', 'AMMO4': '0.027', 'AMMO3': '0.040', 'DAMAGECOUNT': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.416', 'weapon5': '1.262', 'weapon3': '2.236'} +[2023-09-14 12:34:23,701][53811] Sum rewards: 0.114, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.002', 'HITCOUNT': '0.000', 'AMMO5': '0.006', 'AMMO2': '0.015', 'AMMO3': '0.057', 'AMMO4': '0.074', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.250', 'weapon5': '0.320', 'WEAPON3': '0.400', 'weapon4': '0.436', 'weapon3': '0.984', 'weapon2': '1.174'} +[2023-09-14 12:34:24,036][53805] DAMAGECOUNT value on done: 675.0 +[2023-09-14 12:34:24,036][53805] DAMAGECOUNT value on done: 552.0 +[2023-09-14 12:34:24,037][53805] Sum rewards: 4.373, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.022', 'AMMO3': '0.040', 'AMMO4': '0.108', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.282', 'weapon5': '0.312', 'weapon4': '0.358', 'WEAPON3': '0.400', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.450', 'weapon3': '1.992'} +[2023-09-14 12:34:25,699][53802] Updated weights for policy 1, policy_version 360 (0.0013) +[2023-09-14 12:34:25,777][53801] Updated weights for policy 0, policy_version 1072 (0.0015) +[2023-09-14 12:34:26,185][53807] DAMAGECOUNT value on done: 288.0 +[2023-09-14 12:34:26,185][53807] DAMAGECOUNT value on done: 255.0 +[2023-09-14 12:34:26,186][53807] Sum rewards: 2.725, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO3': '0.031', 'WEAPON5': '0.200', 'WEAPON3': '0.300', 'weapon5': '0.312', 'weapon2': '0.410', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.100', 'weapon3': '1.396'} +[2023-09-14 12:34:26,972][53807] DAMAGECOUNT value on done: 614.0 +[2023-09-14 12:34:26,972][53807] DAMAGECOUNT value on done: 492.0 +[2023-09-14 12:34:26,973][53807] Sum rewards: 1.714, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.013', 'weapon5': '0.016', 'AMMO4': '0.064', 'AMMO3': '0.088', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon4': '0.528', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.050', 'weapon3': '1.292', 'weapon2': '1.554'} +[2023-09-14 12:34:26,973][53807] Sum rewards: 3.811, reward structure: {'HEALTH': '-1.550', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.006', 'weapon2': '0.020', 'AMMO4': '0.025', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon5': '0.392', 'WEAPON3': '0.400', 'weapon4': '0.542', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '2.482'} +[2023-09-14 12:34:27,435][109198] Fps is (10 sec: 11468.8, 60 sec: 12356.3, 300 sec: 12772.8). Total num frames: 5881856. Throughput: 0: 1448.6, 1: 1541.8. Samples: 774308. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:34:27,436][109198] Avg episode reward: [(0, '3.308'), (1, '2.363')] +[2023-09-14 12:34:27,438][53585] Saving new best policy, reward=2.363! +[2023-09-14 12:34:27,598][53807] DAMAGECOUNT value on done: 85.0 +[2023-09-14 12:34:27,599][53807] DAMAGECOUNT value on done: 353.0 +[2023-09-14 12:34:27,600][53807] Sum rewards: 3.068, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.009', 'AMMO4': '0.024', 'AMMO3': '0.043', 'weapon5': '0.146', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.318', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.800', 'weapon2': '1.342', 'weapon3': '1.582'} +[2023-09-14 12:34:28,207][53808] DAMAGECOUNT value on done: 936.0 +[2023-09-14 12:34:28,207][53808] Sum rewards: 3.527, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.014', 'AMMO5': '0.015', 'AMMO3': '0.056', 'AMMO4': '0.068', 'weapon2': '0.086', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'WEAPON3': '0.500', 'weapon4': '0.590', 'weapon5': '0.652', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.600', 'weapon3': '2.346'} +[2023-09-14 12:34:28,207][53808] DAMAGECOUNT value on done: 684.0 +[2023-09-14 12:34:28,208][53808] Sum rewards: 5.107, reward structure: {'HEALTH': '-1.500', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.041', 'WEAPON4': '0.100', 'weapon5': '0.164', 'WEAPON5': '0.200', 'weapon4': '0.200', 'weapon2': '0.390', 'WEAPON3': '0.400', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.060', 'weapon3': '2.074'} +[2023-09-14 12:34:28,240][53807] DAMAGECOUNT value on done: 1060.0 +[2023-09-14 12:34:28,240][53807] DAMAGECOUNT value on done: 812.0 +[2023-09-14 12:34:28,241][53807] Sum rewards: 0.982, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.002', 'FRAGCOUNT': '-0.002', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.069', 'weapon2': '0.080', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.400', 'weapon4': '0.450', 'weapon5': '0.520', 'WEAPON3': '0.600', 'weapon3': '2.460'} +[2023-09-14 12:34:29,018][53808] DAMAGECOUNT value on done: 512.0 +[2023-09-14 12:34:29,019][53808] DAMAGECOUNT value on done: 662.0 +[2023-09-14 12:34:29,019][53808] Sum rewards: 2.317, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.015', 'weapon5': '0.046', 'AMMO3': '0.075', 'AMMO4': '0.077', 'WEAPON5': '0.100', 'WEAPON4': '0.300', 'weapon4': '0.390', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.900', 'FRAGCOUNT': '1.000', 'weapon3': '1.052', 'weapon2': '1.856'} +[2023-09-14 12:34:29,020][53808] Sum rewards: 5.822, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.009', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'weapon5': '0.198', 'WEAPON5': '0.200', 'weapon4': '0.202', 'WEAPON3': '0.400', 'weapon2': '0.764', 'weapon3': '1.976', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.030'} +[2023-09-14 12:34:29,488][53808] DAMAGECOUNT value on done: 430.0 +[2023-09-14 12:34:29,488][53808] DAMAGECOUNT value on done: 417.0 +[2023-09-14 12:34:29,489][53808] Sum rewards: 2.037, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.033', 'weapon5': '0.068', 'AMMO3': '0.088', 'WEAPON5': '0.100', 'AMMO4': '0.163', 'weapon4': '0.268', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.550', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.330', 'weapon2': '1.532'} +[2023-09-14 12:34:29,489][53808] Sum rewards: 5.862, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO4': '0.025', 'AMMO3': '0.055', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon4': '0.380', 'WEAPON3': '0.400', 'weapon5': '0.428', 'weapon3': '0.970', 'weapon2': '1.146', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.150'} +[2023-09-14 12:34:30,098][53808] DAMAGECOUNT value on done: 786.0 +[2023-09-14 12:34:30,098][53808] DAMAGECOUNT value on done: 608.0 +[2023-09-14 12:34:30,099][53808] Sum rewards: 4.210, reward structure: {'HEALTH': '-1.600', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.318', 'weapon2': '0.370', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon5': '1.112', 'DAMAGECOUNT': '1.200', 'weapon3': '2.056'} +[2023-09-14 12:34:30,099][53808] Sum rewards: 4.167, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.041', 'WEAPON5': '0.200', 'weapon5': '0.284', 'WEAPON3': '0.400', 'weapon2': '0.734', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.600', 'weapon3': '2.000'} +[2023-09-14 12:34:30,739][53805] DAMAGECOUNT value on done: 438.0 +[2023-09-14 12:34:30,740][53805] Sum rewards: 4.537, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.015', 'AMMO3': '0.058', 'AMMO4': '0.075', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.516', 'weapon4': '0.520', 'weapon3': '0.936', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.300', 'weapon2': '1.308'} +[2023-09-14 12:34:30,740][53805] DAMAGECOUNT value on done: 738.0 +[2023-09-14 12:34:31,333][53811] DAMAGECOUNT value on done: 634.0 +[2023-09-14 12:34:31,333][53811] DAMAGECOUNT value on done: 753.0 +[2023-09-14 12:34:31,334][53811] Sum rewards: 3.123, reward structure: {'HEALTH': '-0.740', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'weapon5': '0.070', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.350', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.060', 'weapon3': '1.090'} +[2023-09-14 12:34:31,438][53805] DAMAGECOUNT value on done: 845.0 +[2023-09-14 12:34:31,439][53805] DAMAGECOUNT value on done: 683.0 +[2023-09-14 12:34:31,439][53805] Sum rewards: 5.629, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.013', 'AMMO3': '0.053', 'AMMO4': '0.064', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.380', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon3': '1.540', 'DAMAGECOUNT': '1.750', 'weapon5': '2.020'} +[2023-09-14 12:34:31,439][53805] Sum rewards: 3.408, reward structure: {'HEALTH': '-1.650', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.220', 'weapon2': '0.366', 'WEAPON3': '0.400', 'weapon5': '0.682', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '2.020'} +[2023-09-14 12:34:31,979][53811] DAMAGECOUNT value on done: 710.0 +[2023-09-14 12:34:31,979][53811] DAMAGECOUNT value on done: 640.0 +[2023-09-14 12:34:31,979][53811] Sum rewards: 4.604, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.026', 'AMMO3': '0.052', 'WEAPON5': '0.100', 'AMMO4': '0.132', 'WEAPON4': '0.300', 'WEAPON3': '0.400', 'weapon4': '0.500', 'weapon5': '0.614', 'weapon3': '1.030', 'weapon2': '1.246', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.200'} +[2023-09-14 12:34:31,980][53811] Sum rewards: 3.299, reward structure: {'HEALTH': '-2.050', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.003', 'weapon5': '0.004', 'AMMO5': '0.010', 'AMMO4': '0.014', 'AMMO3': '0.062', 'WEAPON4': '0.100', 'weapon4': '0.100', 'WEAPON5': '0.200', 'weapon2': '0.320', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.500', 'weapon3': '3.436'} +[2023-09-14 12:34:32,435][109198] Fps is (10 sec: 11059.2, 60 sec: 12083.2, 300 sec: 12730.4). Total num frames: 5935104. Throughput: 0: 1413.5, 1: 1502.7. Samples: 791081. Policy #0 lag: (min: 0.0, avg: 0.4, max: 2.0) +[2023-09-14 12:34:32,436][109198] Avg episode reward: [(0, '3.351'), (1, '2.526')] +[2023-09-14 12:34:32,446][53585] Saving new best policy, reward=2.526! +[2023-09-14 12:34:32,453][53511] Saving new best policy, reward=3.351! +[2023-09-14 12:34:32,630][53802] Updated weights for policy 1, policy_version 370 (0.0013) +[2023-09-14 12:34:32,949][53806] DAMAGECOUNT value on done: 361.0 +[2023-09-14 12:34:32,949][53806] DAMAGECOUNT value on done: 498.0 +[2023-09-14 12:34:32,950][53806] Sum rewards: 0.703, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'FRAGCOUNT': '-0.002', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.040', 'DAMAGECOUNT': '0.100', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.636', 'weapon2': '1.066', 'weapon3': '2.286'} +[2023-09-14 12:34:33,115][53801] Updated weights for policy 0, policy_version 1082 (0.0016) +[2023-09-14 12:34:33,649][53806] DAMAGECOUNT value on done: 415.0 +[2023-09-14 12:34:33,649][53806] DAMAGECOUNT value on done: 612.0 +[2023-09-14 12:34:33,650][53806] Sum rewards: 4.332, reward structure: {'HEALTH': '-1.300', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.010', 'AMMO4': '0.050', 'AMMO3': '0.054', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.316', 'WEAPON3': '0.400', 'weapon4': '0.404', 'FRAGCOUNT': '1.000', 'weapon3': '1.062', 'weapon2': '1.226', 'DAMAGECOUNT': '1.700'} +[2023-09-14 12:34:33,650][53806] Sum rewards: 3.944, reward structure: {'HEALTH': '-1.700', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.029', 'AMMO3': '0.056', 'AMMO4': '0.144', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon5': '0.224', 'WEAPON3': '0.400', 'weapon4': '0.462', 'FRAGCOUNT': '1.000', 'weapon3': '1.064', 'DAMAGECOUNT': '1.300', 'weapon2': '1.554'} +[2023-09-14 12:34:34,516][53806] DAMAGECOUNT value on done: 714.0 +[2023-09-14 12:34:34,517][53806] DAMAGECOUNT value on done: 562.0 +[2023-09-14 12:34:34,517][53806] Sum rewards: 6.016, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.020', 'AMMO3': '0.044', 'WEAPON5': '0.100', 'AMMO4': '0.100', 'weapon5': '0.174', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.468', 'weapon2': '0.974', 'weapon3': '1.332', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.250'} +[2023-09-14 12:34:34,518][53806] Sum rewards: 2.992, reward structure: {'HEALTH': '-2.150', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.015', 'AMMO4': '0.024', 'AMMO3': '0.071', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.546', 'WEAPON3': '0.600', 'weapon5': '0.636', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon3': '2.644'} +[2023-09-14 12:34:35,226][53806] DAMAGECOUNT value on done: 329.0 +[2023-09-14 12:34:35,227][53806] DAMAGECOUNT value on done: 559.0 +[2023-09-14 12:34:35,228][53806] Sum rewards: 2.172, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO4': '0.023', 'AMMO3': '0.030', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.248', 'weapon4': '0.276', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.650', 'weapon3': '1.196', 'weapon2': '1.242'} +[2023-09-14 12:34:37,435][109198] Fps is (10 sec: 11878.3, 60 sec: 12014.9, 300 sec: 12737.8). Total num frames: 6000640. Throughput: 0: 1382.8, 1: 1472.5. Samples: 808901. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:34:37,437][109198] Avg episode reward: [(0, '3.308'), (1, '2.580')] +[2023-09-14 12:34:37,438][53585] Saving new best policy, reward=2.580! +[2023-09-14 12:34:39,511][53802] Updated weights for policy 1, policy_version 380 (0.0013) +[2023-09-14 12:34:39,611][53809] DAMAGECOUNT value on done: 608.0 +[2023-09-14 12:34:39,612][53809] DAMAGECOUNT value on done: 485.0 +[2023-09-14 12:34:39,612][53809] Sum rewards: 5.357, reward structure: {'HEALTH': '-0.410', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.015', 'AMMO3': '0.020', 'AMMO4': '0.075', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.548', 'weapon2': '0.636', 'weapon3': '0.762', 'FRAGCOUNT': '1.000', 'weapon5': '1.108', 'DAMAGECOUNT': '1.200'} +[2023-09-14 12:34:40,293][53809] DAMAGECOUNT value on done: 346.0 +[2023-09-14 12:34:40,293][53809] DAMAGECOUNT value on done: 298.0 +[2023-09-14 12:34:40,293][53809] Sum rewards: 4.078, reward structure: {'HEALTH': '-1.400', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.010', 'AMMO4': '0.025', 'AMMO3': '0.040', 'weapon2': '0.100', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.552', 'weapon5': '0.646', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '2.300'} +[2023-09-14 12:34:40,294][53809] Sum rewards: 4.127, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.022', 'AMMO3': '0.060', 'weapon5': '0.066', 'WEAPON5': '0.100', 'AMMO4': '0.111', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.640', 'weapon3': '0.804', 'FRAGCOUNT': '1.000', 'weapon2': '1.208', 'DAMAGECOUNT': '1.510'} +[2023-09-14 12:34:40,505][53801] Updated weights for policy 0, policy_version 1092 (0.0015) +[2023-09-14 12:34:41,010][53809] DAMAGECOUNT value on done: 366.0 +[2023-09-14 12:34:41,010][53809] DAMAGECOUNT value on done: 495.0 +[2023-09-14 12:34:41,680][53809] DAMAGECOUNT value on done: 420.0 +[2023-09-14 12:34:41,680][53809] DAMAGECOUNT value on done: 409.0 +[2023-09-14 12:34:41,680][53809] Sum rewards: 3.600, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.010', 'AMMO4': '0.050', 'AMMO3': '0.055', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.252', 'WEAPON3': '0.400', 'weapon4': '0.480', 'weapon2': '0.938', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon3': '1.006'} +[2023-09-14 12:34:42,435][109198] Fps is (10 sec: 11878.4, 60 sec: 11741.9, 300 sec: 12697.6). Total num frames: 6053888. Throughput: 0: 1376.5, 1: 1464.4. Samples: 817244. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:34:42,436][109198] Avg episode reward: [(0, '3.261'), (1, '2.684')] +[2023-09-14 12:34:42,443][53585] Saving new best policy, reward=2.684! +[2023-09-14 12:34:44,047][53810] DAMAGECOUNT value on done: 465.0 +[2023-09-14 12:34:44,048][53810] DAMAGECOUNT value on done: 356.0 +[2023-09-14 12:34:44,048][53810] Sum rewards: 0.857, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.002', 'HITCOUNT': '0.000', 'AMMO5': '0.006', 'AMMO2': '0.008', 'AMMO4': '0.039', 'AMMO3': '0.071', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.252', 'DAMAGECOUNT': '0.400', 'WEAPON3': '0.500', 'weapon5': '0.500', 'weapon2': '1.332', 'weapon3': '1.350'} +[2023-09-14 12:34:44,795][53810] DAMAGECOUNT value on done: 476.0 +[2023-09-14 12:34:44,795][53810] DAMAGECOUNT value on done: 646.0 +[2023-09-14 12:34:45,309][53810] DAMAGECOUNT value on done: 162.0 +[2023-09-14 12:34:45,310][53810] DAMAGECOUNT value on done: 519.0 +[2023-09-14 12:34:45,311][53810] Sum rewards: 4.964, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.039', 'AMMO2': '-0.008', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.574', 'FRAGCOUNT': '0.999', 'weapon5': '1.342', 'DAMAGECOUNT': '1.550', 'weapon3': '1.948'} +[2023-09-14 12:34:46,176][53810] DAMAGECOUNT value on done: 373.0 +[2023-09-14 12:34:46,177][53810] Sum rewards: 6.050, reward structure: {'HEALTH': '-1.400', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.015', 'AMMO3': '0.053', 'AMMO4': '0.074', 'weapon5': '0.156', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.406', 'weapon3': '1.092', 'weapon2': '1.596', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.250'} +[2023-09-14 12:34:46,177][53810] DAMAGECOUNT value on done: 353.0 +[2023-09-14 12:34:46,178][53810] Sum rewards: -1.097, reward structure: {'HEALTH': '-3.150', 'DEATHCOUNT': '-3.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.025', 'AMMO3': '0.094', 'AMMO4': '0.125', 'weapon5': '0.136', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon4': '0.322', 'DAMAGECOUNT': '0.400', 'WEAPON3': '0.600', 'weapon3': '1.276', 'weapon2': '1.566'} +[2023-09-14 12:34:46,817][53802] Updated weights for policy 1, policy_version 390 (0.0015) +[2023-09-14 12:34:47,435][109198] Fps is (10 sec: 10240.0, 60 sec: 11400.5, 300 sec: 12643.5). Total num frames: 6103040. Throughput: 0: 1356.8, 1: 1440.6. Samples: 833110. Policy #0 lag: (min: 0.0, avg: 0.5, max: 1.0) +[2023-09-14 12:34:47,437][109198] Avg episode reward: [(0, '3.271'), (1, '2.725')] +[2023-09-14 12:34:47,475][53585] Saving new best policy, reward=2.725! +[2023-09-14 12:34:48,035][53801] Updated weights for policy 0, policy_version 1102 (0.0014) +[2023-09-14 12:34:48,195][53804] DAMAGECOUNT value on done: 530.0 +[2023-09-14 12:34:48,195][53804] DAMAGECOUNT value on done: 552.0 +[2023-09-14 12:34:48,196][53804] Sum rewards: 2.189, reward structure: {'HEALTH': '-2.220', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.021', 'AMMO3': '0.096', 'AMMO4': '0.107', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon4': '0.542', 'WEAPON3': '0.600', 'weapon5': '0.758', 'weapon2': '0.788', 'weapon3': '0.896', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.090'} +[2023-09-14 12:34:48,196][53804] Sum rewards: 6.515, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.011', 'AMMO3': '0.040', 'AMMO4': '0.055', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.330', 'weapon2': '0.378', 'weapon5': '0.380', 'WEAPON3': '0.400', 'FRAGCOUNT': '2.000', 'weapon3': '2.244', 'DAMAGECOUNT': '2.370'} +[2023-09-14 12:34:48,891][53804] DAMAGECOUNT value on done: 528.0 +[2023-09-14 12:34:48,892][53804] DAMAGECOUNT value on done: 479.0 +[2023-09-14 12:34:49,560][53804] DAMAGECOUNT value on done: 1126.0 +[2023-09-14 12:34:49,560][53804] Sum rewards: 3.239, reward structure: {'HEALTH': '-2.700', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO4': '0.002', 'AMMO5': '0.015', 'AMMO3': '0.053', 'WEAPON4': '0.100', 'weapon4': '0.234', 'WEAPON5': '0.300', 'weapon5': '0.362', 'WEAPON3': '0.500', 'weapon2': '0.764', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '2.200', 'weapon3': '2.410'} +[2023-09-14 12:34:49,560][53804] DAMAGECOUNT value on done: 1107.0 +[2023-09-14 12:34:49,561][53804] Sum rewards: 2.273, reward structure: {'HEALTH': '-2.950', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.008', 'AMMO5': '0.011', 'AMMO4': '0.041', 'AMMO3': '0.059', 'WEAPON4': '0.200', 'weapon2': '0.276', 'WEAPON5': '0.300', 'WEAPON3': '0.500', 'weapon5': '0.500', 'weapon4': '0.604', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.750', 'weapon3': '1.974'} +[2023-09-14 12:34:50,141][53804] DAMAGECOUNT value on done: 979.0 +[2023-09-14 12:34:50,142][53804] DAMAGECOUNT value on done: 360.0 +[2023-09-14 12:34:50,142][53804] Sum rewards: 2.408, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.017', 'AMMO3': '0.050', 'AMMO4': '0.083', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.276', 'WEAPON3': '0.400', 'weapon4': '0.640', 'weapon2': '1.026', 'weapon3': '1.308'} +[2023-09-14 12:34:52,435][109198] Fps is (10 sec: 11878.4, 60 sec: 11468.8, 300 sec: 12667.3). Total num frames: 6172672. Throughput: 0: 1392.2, 1: 1476.1. Samples: 852727. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:34:52,436][109198] Avg episode reward: [(0, '3.332'), (1, '2.770')] +[2023-09-14 12:34:52,445][53585] Saving new best policy, reward=2.770! +[2023-09-14 12:34:52,916][53802] Updated weights for policy 1, policy_version 400 (0.0012) +[2023-09-14 12:34:54,479][53801] Updated weights for policy 0, policy_version 1112 (0.0013) +[2023-09-14 12:34:57,435][109198] Fps is (10 sec: 13107.3, 60 sec: 11537.1, 300 sec: 12660.4). Total num frames: 6234112. Throughput: 0: 1404.3, 1: 1487.7. Samples: 862127. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:34:57,437][109198] Avg episode reward: [(0, '3.332'), (1, '2.770')] +[2023-09-14 12:34:59,805][53802] Updated weights for policy 1, policy_version 410 (0.0013) +[2023-09-14 12:35:01,688][53809] Large shaping reward 2.602 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 1.0), ('DAMAGECOUNT', 1.6, 160.0), ('weapon5', 0.002)] +[2023-09-14 12:35:01,852][53801] Updated weights for policy 0, policy_version 1122 (0.0015) +[2023-09-14 12:35:02,435][109198] Fps is (10 sec: 11468.7, 60 sec: 11468.8, 300 sec: 12624.5). Total num frames: 6287360. Throughput: 0: 1410.4, 1: 1493.2. Samples: 879291. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:35:02,436][109198] Avg episode reward: [(0, '3.332'), (1, '2.770')] +[2023-09-14 12:35:06,278][53802] Updated weights for policy 1, policy_version 420 (0.0012) +[2023-09-14 12:35:07,435][109198] Fps is (10 sec: 11878.2, 60 sec: 11605.4, 300 sec: 12632.9). Total num frames: 6352896. Throughput: 0: 1428.4, 1: 1512.3. Samples: 897604. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:35:07,437][109198] Avg episode reward: [(0, '3.332'), (1, '2.770')] +[2023-09-14 12:35:08,198][53811] DAMAGECOUNT value on done: 947.0 +[2023-09-14 12:35:08,199][53811] DAMAGECOUNT value on done: 615.0 +[2023-09-14 12:35:08,199][53811] Sum rewards: 3.730, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.010', 'AMMO4': '0.020', 'AMMO3': '0.060', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.242', 'weapon2': '0.390', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon5': '1.128', 'DAMAGECOUNT': '1.850', 'weapon3': '2.126'} +[2023-09-14 12:35:08,199][53811] Sum rewards: 4.051, reward structure: {'HEALTH': '-2.150', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.009', 'AMMO4': '0.043', 'AMMO3': '0.047', 'WEAPON5': '0.100', 'weapon5': '0.222', 'WEAPON4': '0.300', 'WEAPON3': '0.400', 'weapon4': '0.532', 'weapon2': '1.068', 'weapon3': '1.406', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.070'} +[2023-09-14 12:35:08,466][53805] DAMAGECOUNT value on done: 723.0 +[2023-09-14 12:35:08,466][53805] DAMAGECOUNT value on done: 794.0 +[2023-09-14 12:35:08,467][53805] Sum rewards: 2.135, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.027', 'AMMO3': '0.054', 'WEAPON5': '0.100', 'AMMO4': '0.133', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.474', 'weapon4': '0.538', 'FRAGCOUNT': '1.000', 'weapon3': '1.014', 'weapon2': '1.090', 'DAMAGECOUNT': '1.100'} +[2023-09-14 12:35:08,467][53805] Sum rewards: 5.519, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'weapon4': '0.010', 'AMMO2': '0.015', 'AMMO3': '0.040', 'weapon5': '0.068', 'AMMO4': '0.073', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon2': '0.386', 'WEAPON3': '0.400', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050', 'weapon3': '2.170'} +[2023-09-14 12:35:08,808][53801] Updated weights for policy 0, policy_version 1132 (0.0016) +[2023-09-14 12:35:09,016][53811] DAMAGECOUNT value on done: 473.0 +[2023-09-14 12:35:09,016][53811] DAMAGECOUNT value on done: 516.0 +[2023-09-14 12:35:09,017][53811] Sum rewards: 4.266, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.204', 'WEAPON3': '0.400', 'weapon2': '0.426', 'weapon5': '0.988', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.930'} +[2023-09-14 12:35:09,017][53811] Sum rewards: 3.660, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.015', 'AMMO3': '0.039', 'AMMO4': '0.072', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon5': '0.448', 'weapon4': '0.516', 'weapon3': '0.934', 'weapon2': '0.980', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050'} +[2023-09-14 12:35:09,270][53805] DAMAGECOUNT value on done: 785.0 +[2023-09-14 12:35:09,271][53805] DAMAGECOUNT value on done: 707.0 +[2023-09-14 12:35:09,271][53805] Sum rewards: 4.071, reward structure: {'HEALTH': '-1.600', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.036', 'AMMO2': '-0.007', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.526', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.100', 'weapon5': '1.424', 'weapon3': '2.016'} +[2023-09-14 12:35:09,559][53807] DAMAGECOUNT value on done: 343.0 +[2023-09-14 12:35:09,559][53807] DAMAGECOUNT value on done: 255.0 +[2023-09-14 12:35:09,560][53807] Sum rewards: 3.024, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO5': '0.008', 'AMMO4': '0.009', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon2': '0.282', 'weapon4': '0.346', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.550', 'weapon5': '1.082', 'weapon3': '2.006'} +[2023-09-14 12:35:10,238][53807] DAMAGECOUNT value on done: 714.0 +[2023-09-14 12:35:10,239][53807] DAMAGECOUNT value on done: 532.0 +[2023-09-14 12:35:10,239][53807] Sum rewards: 4.026, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.015', 'AMMO3': '0.046', 'AMMO4': '0.075', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.288', 'WEAPON3': '0.400', 'weapon2': '0.462', 'weapon4': '0.744', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon3': '1.588'} +[2023-09-14 12:35:10,240][53807] Sum rewards: 0.873, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.021', 'AMMO3': '0.078', 'AMMO4': '0.102', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon5': '0.318', 'weapon4': '0.358', 'DAMAGECOUNT': '0.400', 'weapon2': '0.488', 'WEAPON3': '0.600', 'weapon3': '1.994'} +[2023-09-14 12:35:10,879][53807] DAMAGECOUNT value on done: 230.0 +[2023-09-14 12:35:10,880][53807] DAMAGECOUNT value on done: 468.0 +[2023-09-14 12:35:10,880][53807] Sum rewards: 1.441, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.006', 'AMMO4': '0.028', 'AMMO3': '0.064', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.166', 'weapon4': '0.396', 'WEAPON3': '0.500', 'weapon2': '0.832', 'DAMAGECOUNT': '1.450', 'weapon3': '1.796'} +[2023-09-14 12:35:10,881][53807] Sum rewards: 3.444, reward structure: {'HEALTH': '-1.800', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.010', 'AMMO3': '0.044', 'AMMO4': '0.049', 'WEAPON5': '0.100', 'weapon5': '0.128', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.702', 'weapon2': '0.758', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.150', 'weapon3': '1.700'} +[2023-09-14 12:35:11,631][53807] DAMAGECOUNT value on done: 1270.0 +[2023-09-14 12:35:11,632][53807] Sum rewards: 5.947, reward structure: {'HEALTH': '-1.750', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.009', 'AMMO4': '0.020', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'weapon4': '0.150', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.710', 'weapon5': '0.822', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.100', 'weapon3': '2.142'} +[2023-09-14 12:35:11,632][53807] DAMAGECOUNT value on done: 922.0 +[2023-09-14 12:35:11,634][53807] Sum rewards: -0.352, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO2': '0.027', 'AMMO3': '0.090', 'AMMO4': '0.135', 'WEAPON4': '0.200', 'weapon5': '0.242', 'WEAPON5': '0.300', 'weapon4': '0.434', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.100', 'weapon2': '1.146', 'weapon3': '1.360'} +[2023-09-14 12:35:12,366][53808] DAMAGECOUNT value on done: 1041.0 +[2023-09-14 12:35:12,367][53808] DAMAGECOUNT value on done: 729.0 +[2023-09-14 12:35:12,367][53808] Sum rewards: 4.377, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.010', 'AMMO3': '0.048', 'AMMO4': '0.050', 'weapon2': '0.124', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.702', 'weapon5': '0.856', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '1.728'} +[2023-09-14 12:35:12,435][109198] Fps is (10 sec: 11878.3, 60 sec: 11537.8, 300 sec: 12598.7). Total num frames: 6406144. Throughput: 0: 1421.7, 1: 1501.7. Samples: 905861. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:35:12,437][109198] Avg episode reward: [(0, '3.347'), (1, '2.805')] +[2023-09-14 12:35:12,443][53585] Saving new best policy, reward=2.805! +[2023-09-14 12:35:13,008][53808] DAMAGECOUNT value on done: 752.0 +[2023-09-14 12:35:13,009][53808] Sum rewards: 3.559, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.044', 'WEAPON5': '0.200', 'weapon2': '0.356', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.900', 'weapon3': '1.654', 'weapon5': '2.026'} +[2023-09-14 12:35:13,009][53808] DAMAGECOUNT value on done: 562.0 +[2023-09-14 12:35:13,469][53802] Updated weights for policy 1, policy_version 430 (0.0013) +[2023-09-14 12:35:13,518][53808] DAMAGECOUNT value on done: 593.0 +[2023-09-14 12:35:13,518][53808] DAMAGECOUNT value on done: 475.0 +[2023-09-14 12:35:13,518][53808] Sum rewards: 3.764, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.005', 'AMMO4': '0.025', 'weapon5': '0.050', 'AMMO3': '0.057', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.438', 'weapon4': '0.544', 'FRAGCOUNT': '0.999', 'weapon3': '1.182', 'DAMAGECOUNT': '1.760'} +[2023-09-14 12:35:14,120][53808] DAMAGECOUNT value on done: 1073.0 +[2023-09-14 12:35:14,121][53808] DAMAGECOUNT value on done: 896.0 +[2023-09-14 12:35:14,121][53808] Sum rewards: 8.546, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO3': '0.072', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon2': '0.696', 'weapon5': '0.762', 'weapon3': '2.512', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '4.650'} +[2023-09-14 12:35:14,122][53808] Sum rewards: -0.772, reward structure: {'DEATHCOUNT': '-4.000', 'HEALTH': '-4.000', 'HITCOUNT': '0.000', 'AMMO2': '0.017', 'AMMO5': '0.017', 'AMMO4': '0.087', 'weapon5': '0.104', 'AMMO3': '0.106', 'WEAPON4': '0.200', 'weapon4': '0.234', 'WEAPON5': '0.400', 'weapon2': '0.414', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon3': '2.748'} +[2023-09-14 12:35:15,052][53805] DAMAGECOUNT value on done: 808.0 +[2023-09-14 12:35:15,053][53805] DAMAGECOUNT value on done: 643.0 +[2023-09-14 12:35:15,053][53805] Sum rewards: 5.517, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.014', 'AMMO3': '0.036', 'AMMO4': '0.069', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.300', 'weapon4': '0.460', 'weapon5': '0.490', 'weapon2': '0.780', 'weapon3': '1.114', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.050'} +[2023-09-14 12:35:15,822][53805] DAMAGECOUNT value on done: 1150.0 +[2023-09-14 12:35:15,822][53805] DAMAGECOUNT value on done: 938.0 +[2023-09-14 12:35:15,823][53805] Sum rewards: 3.087, reward structure: {'HEALTH': '-4.450', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.037', 'weapon2': '0.046', 'weapon5': '0.096', 'AMMO3': '0.127', 'AMMO4': '0.183', 'WEAPON4': '0.300', 'WEAPON5': '0.400', 'weapon4': '0.618', 'WEAPON3': '0.900', 'weapon3': '2.762', 'FRAGCOUNT': '2.998', 'DAMAGECOUNT': '3.050'} +[2023-09-14 12:35:15,823][53805] Sum rewards: 3.694, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.008', 'AMMO5': '0.015', 'weapon2': '0.040', 'AMMO4': '0.040', 'AMMO3': '0.078', 'WEAPON4': '0.200', 'weapon5': '0.204', 'weapon4': '0.264', 'WEAPON5': '0.300', 'WEAPON3': '0.700', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.550', 'weapon3': '3.294'} +[2023-09-14 12:35:15,923][53811] DAMAGECOUNT value on done: 934.0 +[2023-09-14 12:35:15,923][53811] DAMAGECOUNT value on done: 1043.0 +[2023-09-14 12:35:15,924][53811] Sum rewards: 6.452, reward structure: {'HEALTH': '-2.750', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'weapon2': '0.006', 'AMMO2': '0.013', 'AMMO5': '0.015', 'AMMO4': '0.065', 'AMMO3': '0.073', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon4': '0.390', 'WEAPON3': '0.600', 'weapon5': '0.762', 'weapon3': '2.678', 'DAMAGECOUNT': '3.000', 'FRAGCOUNT': '3.000'} +[2023-09-14 12:35:15,924][53811] Sum rewards: 4.317, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.027', 'weapon5': '0.082', 'AMMO3': '0.099', 'weapon2': '0.102', 'AMMO4': '0.133', 'WEAPON4': '0.200', 'weapon4': '0.344', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.900', 'weapon3': '3.210'} +[2023-09-14 12:35:15,926][53801] Updated weights for policy 0, policy_version 1142 (0.0014) +[2023-09-14 12:35:16,539][53811] DAMAGECOUNT value on done: 644.0 +[2023-09-14 12:35:16,539][53811] DAMAGECOUNT value on done: 790.0 +[2023-09-14 12:35:16,540][53811] Sum rewards: 3.044, reward structure: {'HEALTH': '-1.040', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.007', 'AMMO5': '0.009', 'AMMO3': '0.036', 'AMMO4': '0.037', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'WEAPON3': '0.300', 'weapon5': '0.324', 'weapon4': '0.412', 'weapon2': '0.704', 'DAMAGECOUNT': '0.800', 'FRAGCOUNT': '0.999', 'weapon3': '1.156'} +[2023-09-14 12:35:17,435][109198] Fps is (10 sec: 11878.5, 60 sec: 11741.9, 300 sec: 12607.4). Total num frames: 6471680. Throughput: 0: 1432.9, 1: 1513.1. Samples: 923650. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0) +[2023-09-14 12:35:17,436][109198] Avg episode reward: [(0, '3.408'), (1, '2.826')] +[2023-09-14 12:35:17,438][53511] Saving new best policy, reward=3.408! +[2023-09-14 12:35:17,439][53585] Saving new best policy, reward=2.826! +[2023-09-14 12:35:19,368][53806] DAMAGECOUNT value on done: 503.0 +[2023-09-14 12:35:19,368][53806] DAMAGECOUNT value on done: 366.0 +[2023-09-14 12:35:19,573][53802] Updated weights for policy 1, policy_version 440 (0.0013) +[2023-09-14 12:35:20,033][53806] DAMAGECOUNT value on done: 455.0 +[2023-09-14 12:35:20,034][53806] DAMAGECOUNT value on done: 657.0 +[2023-09-14 12:35:20,724][53806] DAMAGECOUNT value on done: 919.0 +[2023-09-14 12:35:20,724][53806] Sum rewards: 4.333, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.011', 'AMMO4': '0.055', 'AMMO3': '0.088', 'weapon5': '0.154', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.566', 'WEAPON3': '0.600', 'weapon2': '0.772', 'weapon3': '1.630', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.050'} +[2023-09-14 12:35:20,725][53806] DAMAGECOUNT value on done: 662.0 +[2023-09-14 12:35:20,725][53806] Sum rewards: 2.521, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.020', 'weapon4': '0.036', 'AMMO3': '0.051', 'AMMO4': '0.099', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.400', 'weapon2': '0.748', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon5': '1.308', 'weapon3': '1.654'} +[2023-09-14 12:35:21,502][53806] DAMAGECOUNT value on done: 439.0 +[2023-09-14 12:35:21,503][53806] Sum rewards: 3.387, reward structure: {'HEALTH': '-1.350', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO4': '0.025', 'weapon5': '0.040', 'AMMO3': '0.047', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.504', 'weapon2': '0.640', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon3': '1.670'} +[2023-09-14 12:35:21,503][53806] DAMAGECOUNT value on done: 704.0 +[2023-09-14 12:35:21,504][53806] Sum rewards: 4.035, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.005', 'AMMO4': '0.024', 'AMMO3': '0.049', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon5': '0.316', 'weapon4': '0.350', 'WEAPON3': '0.400', 'weapon2': '0.834', 'FRAGCOUNT': '1.000', 'weapon3': '1.402', 'DAMAGECOUNT': '1.450'} +[2023-09-14 12:35:22,435][109198] Fps is (10 sec: 12697.8, 60 sec: 11810.1, 300 sec: 12815.6). Total num frames: 6533120. Throughput: 0: 1446.1, 1: 1523.5. Samples: 942534. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:35:22,436][109198] Avg episode reward: [(0, '3.378'), (1, '2.836')] +[2023-09-14 12:35:22,443][53585] Saving new best policy, reward=2.836! +[2023-09-14 12:35:22,595][53801] Updated weights for policy 0, policy_version 1152 (0.0014) +[2023-09-14 12:35:24,716][53809] DAMAGECOUNT value on done: 485.0 +[2023-09-14 12:35:24,717][53809] Sum rewards: 1.498, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.005', 'AMMO3': '0.040', 'WEAPON5': '0.100', 'weapon5': '0.136', 'WEAPON3': '0.400', 'weapon2': '0.950', 'weapon3': '1.928'} +[2023-09-14 12:35:24,717][53809] DAMAGECOUNT value on done: 633.0 +[2023-09-14 12:35:24,718][53809] Sum rewards: 2.171, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.026', 'AMMO3': '0.050', 'WEAPON4': '0.100', 'AMMO4': '0.130', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.250', 'weapon5': '0.378', 'WEAPON3': '0.400', 'weapon4': '0.622', 'weapon2': '0.816', 'weapon3': '1.190'} +[2023-09-14 12:35:25,257][53809] DAMAGECOUNT value on done: 403.0 +[2023-09-14 12:35:25,257][53809] DAMAGECOUNT value on done: 446.0 +[2023-09-14 12:35:25,258][53809] Sum rewards: 3.393, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.026', 'WEAPON5': '0.100', 'AMMO4': '0.128', 'WEAPON3': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.328', 'weapon5': '0.454', 'weapon3': '0.934', 'weapon2': '0.948', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050'} +[2023-09-14 12:35:25,258][53809] Sum rewards: 4.667, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.010', 'AMMO4': '0.025', 'AMMO3': '0.047', 'weapon2': '0.052', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.348', 'WEAPON3': '0.400', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.698', 'weapon5': '1.782'} +[2023-09-14 12:35:25,841][53802] Updated weights for policy 1, policy_version 450 (0.0014) +[2023-09-14 12:35:25,921][53809] DAMAGECOUNT value on done: 646.0 +[2023-09-14 12:35:25,922][53809] DAMAGECOUNT value on done: 575.0 +[2023-09-14 12:35:25,922][53809] Sum rewards: 7.167, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.047', 'AMMO2': '-0.009', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.672', 'weapon5': '1.380', 'weapon3': '1.874', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.800'} +[2023-09-14 12:35:26,566][53809] DAMAGECOUNT value on done: 505.0 +[2023-09-14 12:35:26,566][53809] DAMAGECOUNT value on done: 514.0 +[2023-09-14 12:35:26,567][53809] Sum rewards: 2.983, reward structure: {'HEALTH': '-2.150', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.003', 'AMMO5': '0.013', 'AMMO4': '0.013', 'weapon4': '0.056', 'AMMO3': '0.069', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'weapon2': '0.408', 'WEAPON3': '0.600', 'weapon5': '0.874', 'FRAGCOUNT': '0.998', 'DAMAGECOUNT': '1.050', 'weapon3': '2.648'} +[2023-09-14 12:35:27,435][109198] Fps is (10 sec: 12697.6, 60 sec: 11946.7, 300 sec: 13010.0). Total num frames: 6598656. Throughput: 0: 1466.1, 1: 1545.1. Samples: 952747. Policy #0 lag: (min: 0.0, avg: 0.6, max: 1.0) +[2023-09-14 12:35:27,437][109198] Avg episode reward: [(0, '3.439'), (1, '2.818')] +[2023-09-14 12:35:27,438][53511] Saving new best policy, reward=3.439! +[2023-09-14 12:35:29,152][53801] Updated weights for policy 0, policy_version 1162 (0.0014) +[2023-09-14 12:35:29,663][53810] DAMAGECOUNT value on done: 610.0 +[2023-09-14 12:35:29,664][53810] DAMAGECOUNT value on done: 356.0 +[2023-09-14 12:35:29,664][53810] Sum rewards: 4.699, reward structure: {'HEALTH': '-0.890', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.302', 'weapon2': '0.490', 'weapon5': '0.792', 'FRAGCOUNT': '1.000', 'weapon3': '1.102', 'DAMAGECOUNT': '1.450'} +[2023-09-14 12:35:30,215][53810] DAMAGECOUNT value on done: 546.0 +[2023-09-14 12:35:30,216][53810] DAMAGECOUNT value on done: 781.0 +[2023-09-14 12:35:30,217][53810] Sum rewards: 4.743, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.001', 'AMMO4': '0.006', 'AMMO5': '0.009', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.310', 'weapon2': '0.356', 'WEAPON3': '0.400', 'weapon5': '0.680', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.350', 'weapon3': '2.292'} +[2023-09-14 12:35:30,693][53810] DAMAGECOUNT value on done: 519.0 +[2023-09-14 12:35:30,694][53810] DAMAGECOUNT value on done: 198.0 +[2023-09-14 12:35:31,511][53810] DAMAGECOUNT value on done: 438.0 +[2023-09-14 12:35:31,512][53810] DAMAGECOUNT value on done: 503.0 +[2023-09-14 12:35:31,512][53810] Sum rewards: 0.566, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.008', 'AMMO4': '0.026', 'AMMO3': '0.067', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.294', 'weapon2': '0.478', 'WEAPON3': '0.500', 'weapon4': '0.534', 'DAMAGECOUNT': '0.650', 'weapon3': '1.604'} +[2023-09-14 12:35:31,513][53810] Sum rewards: 4.773, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.018', 'AMMO3': '0.039', 'AMMO4': '0.088', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon4': '0.460', 'weapon5': '0.936', 'FRAGCOUNT': '0.999', 'weapon2': '1.028', 'weapon3': '1.102', 'DAMAGECOUNT': '1.500'} +[2023-09-14 12:35:32,059][53802] Updated weights for policy 1, policy_version 460 (0.0012) +[2023-09-14 12:35:32,435][109198] Fps is (10 sec: 13107.1, 60 sec: 12151.4, 300 sec: 12996.1). Total num frames: 6664192. Throughput: 0: 1500.9, 1: 1581.0. Samples: 971794. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:35:32,436][109198] Avg episode reward: [(0, '3.480'), (1, '2.819')] +[2023-09-14 12:35:32,442][53511] Saving new best policy, reward=3.480! +[2023-09-14 12:35:33,717][53804] DAMAGECOUNT value on done: 560.0 +[2023-09-14 12:35:33,717][53804] DAMAGECOUNT value on done: 672.0 +[2023-09-14 12:35:33,718][53804] Sum rewards: 4.834, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.015', 'weapon2': '0.020', 'AMMO3': '0.040', 'AMMO4': '0.074', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.718', 'FRAGCOUNT': '0.999', 'weapon5': '1.126', 'DAMAGECOUNT': '1.200', 'weapon3': '1.982'} +[2023-09-14 12:35:34,392][53804] DAMAGECOUNT value on done: 489.0 +[2023-09-14 12:35:34,392][53804] DAMAGECOUNT value on done: 528.0 +[2023-09-14 12:35:35,063][53804] DAMAGECOUNT value on done: 1222.0 +[2023-09-14 12:35:35,063][53804] DAMAGECOUNT value on done: 1271.0 +[2023-09-14 12:35:35,064][53804] Sum rewards: 4.569, reward structure: {'HEALTH': '-1.450', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'weapon2': '0.002', 'AMMO2': '0.009', 'AMMO5': '0.010', 'AMMO3': '0.041', 'AMMO4': '0.046', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.238', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150', 'weapon5': '1.824', 'weapon3': '1.898'} +[2023-09-14 12:35:35,064][53804] Sum rewards: 2.525, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.017', 'weapon4': '0.056', 'AMMO3': '0.068', 'AMMO4': '0.084', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'WEAPON3': '0.500', 'weapon5': '0.500', 'weapon2': '0.840', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.450', 'weapon3': '1.596'} +[2023-09-14 12:35:35,595][53801] Updated weights for policy 0, policy_version 1172 (0.0014) +[2023-09-14 12:35:35,803][53804] DAMAGECOUNT value on done: 370.0 +[2023-09-14 12:35:35,803][53804] Sum rewards: 2.077, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.008', 'AMMO4': '0.040', 'AMMO3': '0.048', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.100', 'WEAPON3': '0.400', 'weapon4': '0.444', 'weapon2': '0.594', 'FRAGCOUNT': '1.000', 'weapon3': '1.542'} +[2023-09-14 12:35:35,804][53804] DAMAGECOUNT value on done: 1109.0 +[2023-09-14 12:35:35,804][53804] Sum rewards: 4.197, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.009', 'weapon4': '0.034', 'AMMO4': '0.044', 'AMMO3': '0.044', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.302', 'WEAPON3': '0.400', 'weapon2': '0.710', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.300', 'weapon3': '2.046'} +[2023-09-14 12:35:37,435][109198] Fps is (10 sec: 12697.6, 60 sec: 12083.2, 300 sec: 12982.2). Total num frames: 6725632. Throughput: 0: 1498.3, 1: 1581.2. Samples: 991302. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:35:37,436][109198] Avg episode reward: [(0, '3.499'), (1, '2.833')] +[2023-09-14 12:35:37,438][53511] Saving new best policy, reward=3.499! +[2023-09-14 12:35:38,261][53802] Updated weights for policy 1, policy_version 470 (0.0018) +[2023-09-14 12:35:41,850][53801] Updated weights for policy 0, policy_version 1182 (0.0016) +[2023-09-14 12:35:42,435][109198] Fps is (10 sec: 13107.2, 60 sec: 12356.3, 300 sec: 12982.2). Total num frames: 6795264. Throughput: 0: 1503.9, 1: 1588.4. Samples: 1001282. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:35:42,437][109198] Avg episode reward: [(0, '3.499'), (1, '2.833')] +[2023-09-14 12:35:44,214][53802] Updated weights for policy 1, policy_version 480 (0.0012) +[2023-09-14 12:35:45,177][109198] Keyboard interrupt detected in the event loop EvtLoop [Runner_EvtLoop, process=main process 109198], exiting... +[2023-09-14 12:35:45,179][53511] Stopping Batcher_0... +[2023-09-14 12:35:45,179][53511] Loop batcher_evt_loop terminating... +[2023-09-14 12:35:45,179][53585] Stopping Batcher_1... +[2023-09-14 12:35:45,180][53585] Loop batcher_evt_loop terminating... +[2023-09-14 12:35:45,179][109198] Runner profile tree view: +main_loop: 330.5015 +[2023-09-14 12:35:45,181][53585] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000481_1970176.pth... +[2023-09-14 12:35:45,180][109198] Collected {0: 4857856, 1: 1970176}, FPS: 12331.3 +[2023-09-14 12:35:45,206][53802] Weights refcount: 2 0 +[2023-09-14 12:35:45,207][53801] Weights refcount: 2 0 +[2023-09-14 12:35:45,208][53802] Stopping InferenceWorker_p1-w0... +[2023-09-14 12:35:45,208][53802] Loop inference_proc1-0_evt_loop terminating... +[2023-09-14 12:35:45,208][53801] Stopping InferenceWorker_p0-w0... +[2023-09-14 12:35:45,208][53801] Loop inference_proc0-0_evt_loop terminating... +[2023-09-14 12:35:45,218][53511] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001187_4861952.pth... +[2023-09-14 12:35:45,236][53585] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000137_561152.pth +[2023-09-14 12:35:45,243][53585] Stopping LearnerWorker_p1... +[2023-09-14 12:35:45,243][53585] Loop learner_proc1_evt_loop terminating... +[2023-09-14 12:35:45,270][53511] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000861_3526656.pth +[2023-09-14 12:35:45,276][53511] Stopping LearnerWorker_p0... +[2023-09-14 12:35:45,276][53511] Loop learner_proc0_evt_loop terminating... +[2023-09-14 12:35:45,984][53804] Stopping RolloutWorker_w0... +[2023-09-14 12:35:45,984][53804] Loop rollout_proc0_evt_loop terminating... +[2023-09-14 12:35:45,987][53806] Stopping RolloutWorker_w1... +[2023-09-14 12:35:45,988][53806] Loop rollout_proc1_evt_loop terminating... +[2023-09-14 12:35:45,989][53811] Stopping RolloutWorker_w6... +[2023-09-14 12:35:45,990][53807] Stopping RolloutWorker_w3... +[2023-09-14 12:35:45,990][53811] Loop rollout_proc6_evt_loop terminating... +[2023-09-14 12:35:45,990][53807] Loop rollout_proc3_evt_loop terminating... +[2023-09-14 12:35:45,990][53805] Stopping RolloutWorker_w2... +[2023-09-14 12:35:45,991][53809] Stopping RolloutWorker_w5... +[2023-09-14 12:35:45,991][53805] Loop rollout_proc2_evt_loop terminating... +[2023-09-14 12:35:45,991][53809] Loop rollout_proc5_evt_loop terminating... +[2023-09-14 12:35:45,995][53810] Stopping RolloutWorker_w7... +[2023-09-14 12:35:45,995][53810] Loop rollout_proc7_evt_loop terminating... +[2023-09-14 12:35:45,996][53808] Stopping RolloutWorker_w4... +[2023-09-14 12:35:45,997][53808] Loop rollout_proc4_evt_loop terminating... +[2023-09-14 12:37:01,572][109198] Environment doom_basic already registered, overwriting... +[2023-09-14 12:37:01,574][109198] Environment doom_two_colors_easy already registered, overwriting... +[2023-09-14 12:37:01,576][109198] Environment doom_two_colors_hard already registered, overwriting... +[2023-09-14 12:37:01,577][109198] Environment doom_dm already registered, overwriting... +[2023-09-14 12:37:01,579][109198] Environment doom_dwango5 already registered, overwriting... +[2023-09-14 12:37:01,580][109198] Environment doom_my_way_home_flat_actions already registered, overwriting... +[2023-09-14 12:37:01,581][109198] Environment doom_defend_the_center_flat_actions already registered, overwriting... +[2023-09-14 12:37:01,582][109198] Environment doom_my_way_home already registered, overwriting... +[2023-09-14 12:37:01,583][109198] Environment doom_deadly_corridor already registered, overwriting... +[2023-09-14 12:37:01,584][109198] Environment doom_defend_the_center already registered, overwriting... +[2023-09-14 12:37:01,585][109198] Environment doom_defend_the_line already registered, overwriting... +[2023-09-14 12:37:01,585][109198] Environment doom_health_gathering already registered, overwriting... +[2023-09-14 12:37:01,586][109198] Environment doom_health_gathering_supreme already registered, overwriting... +[2023-09-14 12:37:01,586][109198] Environment doom_battle already registered, overwriting... +[2023-09-14 12:37:01,587][109198] Environment doom_battle2 already registered, overwriting... +[2023-09-14 12:37:01,588][109198] Environment doom_duel_bots already registered, overwriting... +[2023-09-14 12:37:01,588][109198] Environment doom_deathmatch_bots already registered, overwriting... +[2023-09-14 12:37:01,589][109198] Environment doom_duel already registered, overwriting... +[2023-09-14 12:37:01,589][109198] Environment doom_deathmatch_full already registered, overwriting... +[2023-09-14 12:37:01,590][109198] Environment doom_benchmark already registered, overwriting... +[2023-09-14 12:37:01,591][109198] register_encoder_factory: +[2023-09-14 12:37:01,613][109198] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json +[2023-09-14 12:37:01,614][109198] Experiment dir /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment already exists! +[2023-09-14 12:37:01,615][109198] Resuming existing experiment from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment... +[2023-09-14 12:37:01,616][109198] Weights and Biases integration disabled +[2023-09-14 12:37:01,619][109198] Environment var CUDA_VISIBLE_DEVICES is 0,1 + +[2023-09-14 12:37:03,541][109198] Starting experiment with the following configuration: +help=False +algo=APPO +env=doom_duel +experiment=default_experiment +train_dir=/home/cogstack/Documents/optuna/environments/sample_factory/train_dir +restart_behavior=resume +device=gpu +seed=None +num_policies=2 +async_rl=True +serial_mode=False +batched_sampling=False +num_batches_to_accumulate=2 +worker_num_splits=2 +policy_workers_per_policy=1 +max_policy_lag=1000 +num_workers=8 +num_envs_per_worker=4 +batch_size=1024 +num_batches_per_epoch=1 +num_epochs=1 +rollout=32 +recurrence=32 +shuffle_minibatches=False +gamma=0.99 +reward_scale=1.0 +reward_clip=1000.0 +value_bootstrap=False +normalize_returns=True +exploration_loss_coeff=0.001 +value_loss_coeff=0.5 +kl_loss_coeff=0.0 +exploration_loss=symmetric_kl +gae_lambda=0.95 +ppo_clip_ratio=0.1 +ppo_clip_value=0.2 +with_vtrace=False +vtrace_rho=1.0 +vtrace_c=1.0 +optimizer=adam +adam_eps=1e-06 +adam_beta1=0.9 +adam_beta2=0.999 +max_grad_norm=4.0 +learning_rate=0.0001 +lr_schedule=constant +lr_schedule_kl_threshold=0.008 +lr_adaptive_min=1e-06 +lr_adaptive_max=0.01 +obs_subtract_mean=0.0 +obs_scale=255.0 +normalize_input=True +normalize_input_keys=None +decorrelate_experience_max_seconds=0 +decorrelate_envs_on_one_worker=True +actor_worker_gpus=[] +set_workers_cpu_affinity=True +force_envs_single_thread=False +default_niceness=0 +log_to_file=True +experiment_summaries_interval=10 +flush_summaries_interval=30 +stats_avg=100 +summaries_use_frameskip=True +heartbeat_interval=20 +heartbeat_reporting_interval=600 +train_for_env_steps=10000000 +train_for_seconds=10000000000 +save_every_sec=120 +keep_checkpoints=2 +load_checkpoint_kind=latest +save_milestones_sec=-1 +save_best_every_sec=5 +save_best_metric=reward +save_best_after=100000 +benchmark=False +encoder_mlp_layers=[512, 512] +encoder_conv_architecture=convnet_simple +encoder_conv_mlp_layers=[512] +use_rnn=True +rnn_size=512 +rnn_type=gru +rnn_num_layers=1 +decoder_mlp_layers=[] +nonlinearity=elu +policy_initialization=orthogonal +policy_init_gain=1.0 +actor_critic_share_weights=True +adaptive_stddev=True +continuous_tanh_scale=0.0 +initial_stddev=1.0 +use_env_info_cache=False +env_gpu_actions=False +env_gpu_observations=True +env_frameskip=4 +env_framestack=1 +pixel_format=CHW +use_record_episode_statistics=False +with_wandb=False +wandb_user=None +wandb_project=sample_factory +wandb_group=None +wandb_job_type=SF +wandb_tags=[] +with_pbt=False +pbt_mix_policies_in_one_env=True +pbt_period_env_steps=5000000 +pbt_start_mutation=20000000 +pbt_replace_fraction=0.3 +pbt_mutation_rate=0.15 +pbt_replace_reward_gap=0.1 +pbt_replace_reward_gap_absolute=1e-06 +pbt_optimize_gamma=False +pbt_target_objective=true_objective +pbt_perturb_min=1.1 +pbt_perturb_max=1.5 +num_agents=-1 +num_humans=0 +num_bots=-1 +start_bot_difficulty=None +timelimit=None +res_w=128 +res_h=72 +wide_aspect_ratio=False +eval_env_frameskip=1 +fps=35 +command_line=--env=doom_dm --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=20000000 +cli_args={'env': 'doom_dm', 'num_workers': 8, 'num_envs_per_worker': 4, 'train_for_env_steps': 20000000} +git_hash=20b6d44612dad7d171f23e13b1f3b4c5e5631cf9 +git_repo_name=https://github.com/MattStammers/optuna.git +[2023-09-14 12:37:03,543][109198] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json... +[2023-09-14 12:37:03,663][109198] Rollout worker 0 uses device cpu +[2023-09-14 12:37:03,664][109198] Rollout worker 1 uses device cpu +[2023-09-14 12:37:03,665][109198] Rollout worker 2 uses device cpu +[2023-09-14 12:37:03,667][109198] Rollout worker 3 uses device cpu +[2023-09-14 12:37:03,669][109198] Rollout worker 4 uses device cpu +[2023-09-14 12:37:03,671][109198] Rollout worker 5 uses device cpu +[2023-09-14 12:37:03,672][109198] Rollout worker 6 uses device cpu +[2023-09-14 12:37:03,673][109198] Rollout worker 7 uses device cpu +[2023-09-14 12:37:03,747][109198] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:37:03,748][109198] InferenceWorker_p0-w0: min num requests: 1 +[2023-09-14 12:37:03,753][109198] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:37:03,754][109198] InferenceWorker_p1-w0: min num requests: 1 +[2023-09-14 12:37:03,790][109198] Starting all processes... +[2023-09-14 12:37:03,792][109198] Starting process learner_proc0 +[2023-09-14 12:37:05,393][109198] Starting process learner_proc1 +[2023-09-14 12:37:05,395][74942] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:37:05,396][74942] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 +[2023-09-14 12:37:05,434][74942] Num visible devices: 1 +[2023-09-14 12:37:05,475][74942] Starting seed is not provided +[2023-09-14 12:37:05,475][74942] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:37:05,476][74942] Initializing actor-critic model on device cuda:0 +[2023-09-14 12:37:05,476][74942] RunningMeanStd input shape: (23,) +[2023-09-14 12:37:05,476][74942] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:37:05,477][74942] RunningMeanStd input shape: (1,) +[2023-09-14 12:37:05,488][74942] ConvEncoder: input_channels=3 +[2023-09-14 12:37:05,599][74942] Conv encoder output size: 512 +[2023-09-14 12:37:05,600][74942] Policy head output size: 640 +[2023-09-14 12:37:05,618][74942] Created Actor Critic model with architecture: +[2023-09-14 12:37:05,618][74942] ActorCriticSharedWeights( + (obs_normalizer): ObservationNormalizer( + (running_mean_std): RunningMeanStdDictInPlace( + (running_mean_std): ModuleDict( + (measurements): RunningMeanStdInPlace() + (obs): RunningMeanStdInPlace() + ) + ) + ) + (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) + (encoder): VizdoomEncoder( + (basic_encoder): ConvEncoder( + (enc): RecursiveScriptModule( + original_name=ConvEncoderImpl + (conv_head): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Conv2d) + (1): RecursiveScriptModule(original_name=ELU) + (2): RecursiveScriptModule(original_name=Conv2d) + (3): RecursiveScriptModule(original_name=ELU) + (4): RecursiveScriptModule(original_name=Conv2d) + (5): RecursiveScriptModule(original_name=ELU) + ) + (mlp_layers): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Linear) + (1): RecursiveScriptModule(original_name=ELU) + ) + ) + ) + (measurements_head): Sequential( + (0): Linear(in_features=23, out_features=128, bias=True) + (1): ELU(alpha=1.0) + (2): Linear(in_features=128, out_features=128, bias=True) + (3): ELU(alpha=1.0) + ) + ) + (core): ModelCoreRNN( + (core): GRU(640, 512) + ) + (decoder): MlpDecoder( + (mlp): Identity() + ) + (critic_linear): Linear(in_features=512, out_features=1, bias=True) + (action_parameterization): ActionParameterizationDefault( + (distribution_linear): Linear(in_features=512, out_features=41, bias=True) + ) +) +[2023-09-14 12:37:06,503][74942] Using optimizer +[2023-09-14 12:37:06,504][74942] Loading state from checkpoint /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001187_4861952.pth... +[2023-09-14 12:37:06,529][74942] Loading model from checkpoint +[2023-09-14 12:37:06,534][74942] Loaded experiment state at self.train_step=1187, self.env_steps=4861952 +[2023-09-14 12:37:06,535][74942] Initialized policy 0 weights for model version 1187 +[2023-09-14 12:37:06,536][74942] LearnerWorker_p0 finished initialization! +[2023-09-14 12:37:06,537][74942] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:37:07,036][75052] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:37:07,037][75052] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for learning process 1 +[2023-09-14 12:37:07,035][109198] Starting all processes... +[2023-09-14 12:37:07,041][109198] Starting process inference_proc0-0 +[2023-09-14 12:37:07,042][109198] Starting process inference_proc1-0 +[2023-09-14 12:37:07,043][109198] Starting process rollout_proc0 +[2023-09-14 12:37:07,043][109198] Starting process rollout_proc1 +[2023-09-14 12:37:07,044][109198] Starting process rollout_proc2 +[2023-09-14 12:37:07,045][109198] Starting process rollout_proc3 +[2023-09-14 12:37:07,073][75052] Num visible devices: 1 +[2023-09-14 12:37:07,045][109198] Starting process rollout_proc4 +[2023-09-14 12:37:07,046][109198] Starting process rollout_proc5 +[2023-09-14 12:37:07,047][109198] Starting process rollout_proc6 +[2023-09-14 12:37:07,048][109198] Starting process rollout_proc7 +[2023-09-14 12:37:07,119][75052] Starting seed is not provided +[2023-09-14 12:37:07,119][75052] Using GPUs [0] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:37:07,120][75052] Initializing actor-critic model on device cuda:0 +[2023-09-14 12:37:07,120][75052] RunningMeanStd input shape: (23,) +[2023-09-14 12:37:07,121][75052] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:37:07,121][75052] RunningMeanStd input shape: (1,) +[2023-09-14 12:37:07,140][75052] ConvEncoder: input_channels=3 +[2023-09-14 12:37:07,369][75052] Conv encoder output size: 512 +[2023-09-14 12:37:07,370][75052] Policy head output size: 640 +[2023-09-14 12:37:07,400][75052] Created Actor Critic model with architecture: +[2023-09-14 12:37:07,400][75052] ActorCriticSharedWeights( + (obs_normalizer): ObservationNormalizer( + (running_mean_std): RunningMeanStdDictInPlace( + (running_mean_std): ModuleDict( + (measurements): RunningMeanStdInPlace() + (obs): RunningMeanStdInPlace() + ) + ) + ) + (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) + (encoder): VizdoomEncoder( + (basic_encoder): ConvEncoder( + (enc): RecursiveScriptModule( + original_name=ConvEncoderImpl + (conv_head): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Conv2d) + (1): RecursiveScriptModule(original_name=ELU) + (2): RecursiveScriptModule(original_name=Conv2d) + (3): RecursiveScriptModule(original_name=ELU) + (4): RecursiveScriptModule(original_name=Conv2d) + (5): RecursiveScriptModule(original_name=ELU) + ) + (mlp_layers): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Linear) + (1): RecursiveScriptModule(original_name=ELU) + ) + ) + ) + (measurements_head): Sequential( + (0): Linear(in_features=23, out_features=128, bias=True) + (1): ELU(alpha=1.0) + (2): Linear(in_features=128, out_features=128, bias=True) + (3): ELU(alpha=1.0) + ) + ) + (core): ModelCoreRNN( + (core): GRU(640, 512) + ) + (decoder): MlpDecoder( + (mlp): Identity() + ) + (critic_linear): Linear(in_features=512, out_features=1, bias=True) + (action_parameterization): ActionParameterizationDefault( + (distribution_linear): Linear(in_features=512, out_features=41, bias=True) + ) +) +[2023-09-14 12:37:08,655][75052] Using optimizer +[2023-09-14 12:37:08,656][75052] Loading state from checkpoint /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000481_1970176.pth... +[2023-09-14 12:37:08,685][75052] Loading model from checkpoint +[2023-09-14 12:37:08,690][75052] Loaded experiment state at self.train_step=481, self.env_steps=1970176 +[2023-09-14 12:37:08,691][75052] Initialized policy 1 weights for model version 481 +[2023-09-14 12:37:08,693][75052] LearnerWorker_p1 finished initialization! +[2023-09-14 12:37:08,693][75052] Using GPUs [0] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:37:08,973][75218] Worker 3 uses CPU cores [12, 13, 14, 15] +[2023-09-14 12:37:09,067][75219] Worker 4 uses CPU cores [16, 17, 18, 19] +[2023-09-14 12:37:09,075][75215] Worker 1 uses CPU cores [4, 5, 6, 7] +[2023-09-14 12:37:09,077][75217] Worker 2 uses CPU cores [8, 9, 10, 11] +[2023-09-14 12:37:09,323][75216] Worker 0 uses CPU cores [0, 1, 2, 3] +[2023-09-14 12:37:09,474][75209] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:37:09,474][75209] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for inference process 1 +[2023-09-14 12:37:09,491][75209] Num visible devices: 1 +[2023-09-14 12:37:09,616][75254] Worker 7 uses CPU cores [28, 29, 30, 31] +[2023-09-14 12:37:09,660][75252] Worker 5 uses CPU cores [20, 21, 22, 23] +[2023-09-14 12:37:09,685][75253] Worker 6 uses CPU cores [24, 25, 26, 27] +[2023-09-14 12:37:09,699][75214] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:37:09,699][75214] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 +[2023-09-14 12:37:09,718][75214] Num visible devices: 1 +[2023-09-14 12:37:10,169][75209] RunningMeanStd input shape: (23,) +[2023-09-14 12:37:10,170][75209] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:37:10,170][75209] RunningMeanStd input shape: (1,) +[2023-09-14 12:37:10,182][75209] ConvEncoder: input_channels=3 +[2023-09-14 12:37:10,286][75209] Conv encoder output size: 512 +[2023-09-14 12:37:10,287][75209] Policy head output size: 640 +[2023-09-14 12:37:10,315][75214] RunningMeanStd input shape: (23,) +[2023-09-14 12:37:10,315][75214] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:37:10,316][75214] RunningMeanStd input shape: (1,) +[2023-09-14 12:37:10,327][75214] ConvEncoder: input_channels=3 +[2023-09-14 12:37:10,435][75214] Conv encoder output size: 512 +[2023-09-14 12:37:10,436][75214] Policy head output size: 640 +[2023-09-14 12:37:10,565][109198] Inference worker 1-0 is ready! +[2023-09-14 12:37:10,723][109198] Inference worker 0-0 is ready! +[2023-09-14 12:37:10,724][109198] All inference workers are ready! Signal rollout workers to start! +[2023-09-14 12:37:10,729][75218] Multi agent env, num agents: 2 +[2023-09-14 12:37:10,729][75219] Multi agent env, num agents: 2 +[2023-09-14 12:37:10,729][75215] Multi agent env, num agents: 2 +[2023-09-14 12:37:10,730][75252] Multi agent env, num agents: 2 +[2023-09-14 12:37:10,731][75216] Multi agent env, num agents: 2 +[2023-09-14 12:37:10,732][75217] Multi agent env, num agents: 2 +[2023-09-14 12:37:10,732][75254] Multi agent env, num agents: 2 +[2023-09-14 12:37:10,733][75253] Multi agent env, num agents: 2 +[2023-09-14 12:37:10,764][75218] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:37:10,765][75216] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:37:10,768][75216] Multi agent env, num agents: 2 +[2023-09-14 12:37:10,769][75218] Multi agent env, num agents: 2 +[2023-09-14 12:37:10,769][75252] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:37:10,772][75217] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:37:10,772][75252] Multi agent env, num agents: 2 +[2023-09-14 12:37:10,774][75254] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:37:10,775][75217] Multi agent env, num agents: 2 +[2023-09-14 12:37:10,775][75253] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:37:10,776][75215] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:37:10,776][75219] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:37:10,778][75254] Multi agent env, num agents: 2 +[2023-09-14 12:37:10,779][75253] Multi agent env, num agents: 2 +[2023-09-14 12:37:10,780][75215] Multi agent env, num agents: 2 +[2023-09-14 12:37:10,780][75219] Multi agent env, num agents: 2 +[2023-09-14 12:37:10,807][75217] Port 40500 is available +[2023-09-14 12:37:10,807][75252] Port 40800 is available +[2023-09-14 12:37:10,807][75216] Port 40300 is available +[2023-09-14 12:37:10,807][75217] Using port 40500 +[2023-09-14 12:37:10,807][75252] Using port 40800 +[2023-09-14 12:37:10,807][75216] Using port 40300 +[2023-09-14 12:37:10,808][75217] Initializing env for player 0, init_info: {'port': 40500}... +[2023-09-14 12:37:10,808][75252] Initializing env for player 0, init_info: {'port': 40800}... +[2023-09-14 12:37:10,808][75216] Initializing env for player 0, init_info: {'port': 40300}... +[2023-09-14 12:37:10,810][75254] UDP port 41000 cannot be used [Errno 98] Address already in use +[2023-09-14 12:37:10,810][75254] Port 42000 is available +[2023-09-14 12:37:10,811][75254] Using port 42000 +[2023-09-14 12:37:10,813][75254] Initializing env for player 0, init_info: {'port': 42000}... +[2023-09-14 12:37:10,814][75218] Port 40600 is available +[2023-09-14 12:37:10,814][75218] Using port 40600 +[2023-09-14 12:37:10,815][75218] Initializing env for player 0, init_info: {'port': 40600}... +[2023-09-14 12:37:10,825][75253] Port 40900 is available +[2023-09-14 12:37:10,825][75253] Using port 40900 +[2023-09-14 12:37:10,826][75215] Port 40400 is available +[2023-09-14 12:37:10,826][75215] Using port 40400 +[2023-09-14 12:37:10,826][75253] Initializing env for player 0, init_info: {'port': 40900}... +[2023-09-14 12:37:10,826][75219] Port 40700 is available +[2023-09-14 12:37:10,827][75219] Using port 40700 +[2023-09-14 12:37:10,827][75215] Initializing env for player 0, init_info: {'port': 40400}... +[2023-09-14 12:37:10,837][75217] Using port 40500 on host... +[2023-09-14 12:37:10,841][75254] Using port 42000 on host... +[2023-09-14 12:37:10,843][75216] Using port 40300 on host... +[2023-09-14 12:37:10,849][75218] Using port 40600 on host... +[2023-09-14 12:37:10,854][75252] Using port 40800 on host... +[2023-09-14 12:37:10,855][75253] Using port 40900 on host... +[2023-09-14 12:37:10,858][75217] Initializing env for player 1, init_info: {'port': 40500}... +[2023-09-14 12:37:10,858][75216] Initializing env for player 1, init_info: {'port': 40300}... +[2023-09-14 12:37:10,860][75215] Using port 40400 on host... +[2023-09-14 12:37:10,860][75252] Initializing env for player 1, init_info: {'port': 40800}... +[2023-09-14 12:37:10,863][75254] Initializing env for player 1, init_info: {'port': 42000}... +[2023-09-14 12:37:10,865][75218] Initializing env for player 1, init_info: {'port': 40600}... +[2023-09-14 12:37:10,877][75253] Initializing env for player 1, init_info: {'port': 40900}... +[2023-09-14 12:37:10,878][75215] Initializing env for player 1, init_info: {'port': 40400}... +[2023-09-14 12:37:11,619][109198] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 6832128. Throughput: 0: nan, 1: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 12:37:11,938][75216] Initialized w:0 v:0 player:1 +[2023-09-14 12:37:11,941][75216] Initialized w:0 v:0 player:0 +[2023-09-14 12:37:11,941][75216] 2 agent workers initialized for env 0! +[2023-09-14 12:37:11,948][75253] Initialized w:6 v:0 player:0 +[2023-09-14 12:37:11,949][75253] Initialized w:6 v:0 player:1 +[2023-09-14 12:37:11,950][75253] 2 agent workers initialized for env 6! +[2023-09-14 12:37:11,956][75216] Decorrelating experience for 0 frames... +[2023-09-14 12:37:11,957][75216] Port 40301 is available +[2023-09-14 12:37:11,957][75216] Using port 40301 +[2023-09-14 12:37:11,964][75253] Decorrelating experience for 0 frames... +[2023-09-14 12:37:11,965][75253] Port 40901 is available +[2023-09-14 12:37:11,965][75253] Using port 40901 +[2023-09-14 12:37:11,965][75253] Initializing env for player 0, init_info: {'port': 40901}... +[2023-09-14 12:37:11,985][75252] Initialized w:5 v:0 player:1 +[2023-09-14 12:37:11,986][75252] Initialized w:5 v:0 player:0 +[2023-09-14 12:37:11,987][75252] 2 agent workers initialized for env 5! +[2023-09-14 12:37:11,992][75217] Initialized w:2 v:0 player:0 +[2023-09-14 12:37:11,993][75217] Initialized w:2 v:0 player:1 +[2023-09-14 12:37:11,994][75253] Using port 40901 on host... +[2023-09-14 12:37:11,995][75217] 2 agent workers initialized for env 2! +[2023-09-14 12:37:11,997][75252] Decorrelating experience for 0 frames... +[2023-09-14 12:37:11,998][75252] Port 40801 is available +[2023-09-14 12:37:11,998][75252] Using port 40801 +[2023-09-14 12:37:11,999][75252] Initializing env for player 0, init_info: {'port': 40801}... +[2023-09-14 12:37:12,001][75218] Initialized w:3 v:0 player:0 +[2023-09-14 12:37:12,001][75218] Initialized w:3 v:0 player:1 +[2023-09-14 12:37:12,003][75218] 2 agent workers initialized for env 3! +[2023-09-14 12:37:12,003][75215] Initialized w:1 v:0 player:0 +[2023-09-14 12:37:12,003][75215] Initialized w:1 v:0 player:1 +[2023-09-14 12:37:12,005][75215] 2 agent workers initialized for env 1! +[2023-09-14 12:37:12,006][75217] Decorrelating experience for 0 frames... +[2023-09-14 12:37:12,006][75217] Port 40501 is available +[2023-09-14 12:37:12,007][75217] Using port 40501 +[2023-09-14 12:37:12,008][75216] Initializing env for player 0, init_info: {'port': 40301}... +[2023-09-14 12:37:12,009][75254] Initialized w:7 v:0 player:1 +[2023-09-14 12:37:12,010][75254] Initialized w:7 v:0 player:0 +[2023-09-14 12:37:12,012][75254] 2 agent workers initialized for env 7! +[2023-09-14 12:37:12,016][75215] Decorrelating experience for 0 frames... +[2023-09-14 12:37:12,016][75253] Initializing env for player 1, init_info: {'port': 40901}... +[2023-09-14 12:37:12,016][75215] Port 40401 is available +[2023-09-14 12:37:12,017][75215] Using port 40401 +[2023-09-14 12:37:12,017][75218] Decorrelating experience for 0 frames... +[2023-09-14 12:37:12,017][75215] Initializing env for player 0, init_info: {'port': 40401}... +[2023-09-14 12:37:12,017][75218] Port 40601 is available +[2023-09-14 12:37:12,017][75218] Using port 40601 +[2023-09-14 12:37:12,018][75218] Initializing env for player 0, init_info: {'port': 40601}... +[2023-09-14 12:37:12,029][75252] Using port 40801 on host... +[2023-09-14 12:37:12,029][75254] Decorrelating experience for 0 frames... +[2023-09-14 12:37:12,030][75254] UDP port 41001 cannot be used [Errno 98] Address already in use +[2023-09-14 12:37:12,030][75254] Port 42001 is available +[2023-09-14 12:37:12,031][75254] Using port 42001 +[2023-09-14 12:37:12,031][75254] Initializing env for player 0, init_info: {'port': 42001}... +[2023-09-14 12:37:12,038][75219] Initializing env for player 0, init_info: {'port': 40700}... +[2023-09-14 12:37:12,038][75216] Using port 40301 on host... +[2023-09-14 12:37:12,049][75218] Using port 40601 on host... +[2023-09-14 12:37:12,049][75252] Initializing env for player 1, init_info: {'port': 40801}... +[2023-09-14 12:37:12,052][75215] Using port 40401 on host... +[2023-09-14 12:37:12,058][75216] Initializing env for player 1, init_info: {'port': 40301}... +[2023-09-14 12:37:12,062][75254] Using port 42001 on host... +[2023-09-14 12:37:12,068][75215] Initializing env for player 1, init_info: {'port': 40401}... +[2023-09-14 12:37:12,068][75218] Initializing env for player 1, init_info: {'port': 40601}... +[2023-09-14 12:37:12,082][75219] Using port 40700 on host... +[2023-09-14 12:37:12,082][75254] Initializing env for player 1, init_info: {'port': 42001}... +[2023-09-14 12:37:12,089][75219] Initializing env for player 1, init_info: {'port': 40700}... +[2023-09-14 12:37:13,052][75253] Initialized w:6 v:1 player:0 +[2023-09-14 12:37:13,053][75253] Initialized w:6 v:1 player:1 +[2023-09-14 12:37:13,054][75253] 2 agent workers initialized for env 6! +[2023-09-14 12:37:13,064][75253] Decorrelating experience for 32 frames... +[2023-09-14 12:37:13,067][75217] Initializing env for player 0, init_info: {'port': 40501}... +[2023-09-14 12:37:13,103][75217] Using port 40501 on host... +[2023-09-14 12:37:13,118][75217] Initializing env for player 1, init_info: {'port': 40501}... +[2023-09-14 12:37:13,135][75253] Multi agent env, num agents: 2 +[2023-09-14 12:37:13,144][75254] Initialized w:7 v:1 player:1 +[2023-09-14 12:37:13,144][75254] Initialized w:7 v:1 player:0 +[2023-09-14 12:37:13,146][75254] 2 agent workers initialized for env 7! +[2023-09-14 12:37:13,164][75253] Multi agent env, num agents: 2 +[2023-09-14 12:37:13,167][75215] Initialized w:1 v:1 player:0 +[2023-09-14 12:37:13,168][75215] Initialized w:1 v:1 player:1 +[2023-09-14 12:37:13,169][75254] Decorrelating experience for 32 frames... +[2023-09-14 12:37:13,169][75215] 2 agent workers initialized for env 1! +[2023-09-14 12:37:13,179][75215] Decorrelating experience for 32 frames... +[2023-09-14 12:37:13,188][75218] Initialized w:3 v:1 player:1 +[2023-09-14 12:37:13,189][75218] Initialized w:3 v:1 player:0 +[2023-09-14 12:37:13,189][75216] Initialized w:0 v:1 player:0 +[2023-09-14 12:37:13,190][75216] Initialized w:0 v:1 player:1 +[2023-09-14 12:37:13,190][75218] 2 agent workers initialized for env 3! +[2023-09-14 12:37:13,191][75216] 2 agent workers initialized for env 0! +[2023-09-14 12:37:13,194][75253] Port 40902 is available +[2023-09-14 12:37:13,194][75253] Using port 40902 +[2023-09-14 12:37:13,194][75253] Initializing env for player 0, init_info: {'port': 40902}... +[2023-09-14 12:37:13,198][75216] Decorrelating experience for 32 frames... +[2023-09-14 12:37:13,200][75218] Decorrelating experience for 32 frames... +[2023-09-14 12:37:13,217][75252] Initialized w:5 v:1 player:1 +[2023-09-14 12:37:13,218][75252] Initialized w:5 v:1 player:0 +[2023-09-14 12:37:13,219][75252] 2 agent workers initialized for env 5! +[2023-09-14 12:37:13,227][75253] Using port 40902 on host... +[2023-09-14 12:37:13,228][75219] Initialized w:4 v:0 player:1 +[2023-09-14 12:37:13,228][75219] Initialized w:4 v:0 player:0 +[2023-09-14 12:37:13,229][75252] Decorrelating experience for 32 frames... +[2023-09-14 12:37:13,230][75219] 2 agent workers initialized for env 4! +[2023-09-14 12:37:13,239][75219] Decorrelating experience for 0 frames... +[2023-09-14 12:37:13,239][75219] Port 40701 is available +[2023-09-14 12:37:13,240][75219] Using port 40701 +[2023-09-14 12:37:13,240][75219] Initializing env for player 0, init_info: {'port': 40701}... +[2023-09-14 12:37:13,241][75254] Multi agent env, num agents: 2 +[2023-09-14 12:37:13,245][75253] Initializing env for player 1, init_info: {'port': 40902}... +[2023-09-14 12:37:13,257][75215] Multi agent env, num agents: 2 +[2023-09-14 12:37:13,266][75216] Multi agent env, num agents: 2 +[2023-09-14 12:37:13,278][75218] Multi agent env, num agents: 2 +[2023-09-14 12:37:13,279][75254] Multi agent env, num agents: 2 +[2023-09-14 12:37:13,280][75219] Using port 40701 on host... +[2023-09-14 12:37:13,291][75219] Initializing env for player 1, init_info: {'port': 40701}... +[2023-09-14 12:37:13,301][75216] Multi agent env, num agents: 2 +[2023-09-14 12:37:13,303][75252] Multi agent env, num agents: 2 +[2023-09-14 12:37:13,304][75215] Multi agent env, num agents: 2 +[2023-09-14 12:37:13,327][75254] UDP port 41002 cannot be used [Errno 98] Address already in use +[2023-09-14 12:37:13,328][75254] Port 42002 is available +[2023-09-14 12:37:13,328][75218] Multi agent env, num agents: 2 +[2023-09-14 12:37:13,328][75254] Using port 42002 +[2023-09-14 12:37:13,330][75216] Port 40302 is available +[2023-09-14 12:37:13,330][75216] Using port 40302 +[2023-09-14 12:37:13,331][75216] Initializing env for player 0, init_info: {'port': 40302}... +[2023-09-14 12:37:13,350][75215] Port 40402 is available +[2023-09-14 12:37:13,350][75252] Multi agent env, num agents: 2 +[2023-09-14 12:37:13,350][75215] Using port 40402 +[2023-09-14 12:37:13,350][75215] Initializing env for player 0, init_info: {'port': 40402}... +[2023-09-14 12:37:13,357][75218] Port 40602 is available +[2023-09-14 12:37:13,357][75218] Using port 40602 +[2023-09-14 12:37:13,358][75218] Initializing env for player 0, init_info: {'port': 40602}... +[2023-09-14 12:37:13,359][75216] Using port 40302 on host... +[2023-09-14 12:37:13,381][75216] Initializing env for player 1, init_info: {'port': 40302}... +[2023-09-14 12:37:13,385][75215] Using port 40402 on host... +[2023-09-14 12:37:13,390][75218] Using port 40602 on host... +[2023-09-14 12:37:13,395][75252] Port 40802 is available +[2023-09-14 12:37:13,395][75252] Using port 40802 +[2023-09-14 12:37:13,396][75252] Initializing env for player 0, init_info: {'port': 40802}... +[2023-09-14 12:37:13,401][75215] Initializing env for player 1, init_info: {'port': 40402}... +[2023-09-14 12:37:13,408][75218] Initializing env for player 1, init_info: {'port': 40602}... +[2023-09-14 12:37:13,441][75252] Using port 40802 on host... +[2023-09-14 12:37:13,449][75252] Initializing env for player 1, init_info: {'port': 40802}... +[2023-09-14 12:37:14,216][75217] Initialized w:2 v:1 player:1 +[2023-09-14 12:37:14,217][75217] Initialized w:2 v:1 player:0 +[2023-09-14 12:37:14,219][75217] 2 agent workers initialized for env 2! +[2023-09-14 12:37:14,233][75217] Decorrelating experience for 32 frames... +[2023-09-14 12:37:14,239][75254] Initializing env for player 0, init_info: {'port': 42002}... +[2023-09-14 12:37:14,279][75254] Using port 42002 on host... +[2023-09-14 12:37:14,289][75254] Initializing env for player 1, init_info: {'port': 42002}... +[2023-09-14 12:37:14,302][75217] Multi agent env, num agents: 2 +[2023-09-14 12:37:14,334][75217] Multi agent env, num agents: 2 +[2023-09-14 12:37:14,350][75253] Initialized w:6 v:2 player:0 +[2023-09-14 12:37:14,351][75253] Initialized w:6 v:2 player:1 +[2023-09-14 12:37:14,353][75253] 2 agent workers initialized for env 6! +[2023-09-14 12:37:14,363][75253] Decorrelating experience for 64 frames... +[2023-09-14 12:37:14,374][75217] Port 40502 is available +[2023-09-14 12:37:14,374][75217] Using port 40502 +[2023-09-14 12:37:14,374][75217] Initializing env for player 0, init_info: {'port': 40502}... +[2023-09-14 12:37:14,409][75217] Using port 40502 on host... +[2023-09-14 12:37:14,412][75216] Initialized w:0 v:2 player:0 +[2023-09-14 12:37:14,413][75216] Initialized w:0 v:2 player:1 +[2023-09-14 12:37:14,414][75216] 2 agent workers initialized for env 0! +[2023-09-14 12:37:14,425][75217] Initializing env for player 1, init_info: {'port': 40502}... +[2023-09-14 12:37:14,432][75216] Decorrelating experience for 64 frames... +[2023-09-14 12:37:14,440][75219] Initialized w:4 v:1 player:0 +[2023-09-14 12:37:14,441][75219] Initialized w:4 v:1 player:1 +[2023-09-14 12:37:14,443][75219] 2 agent workers initialized for env 4! +[2023-09-14 12:37:14,452][75219] Decorrelating experience for 32 frames... +[2023-09-14 12:37:14,453][75218] Initialized w:3 v:2 player:0 +[2023-09-14 12:37:14,453][75218] Initialized w:3 v:2 player:1 +[2023-09-14 12:37:14,455][75218] 2 agent workers initialized for env 3! +[2023-09-14 12:37:14,467][75218] Decorrelating experience for 64 frames... +[2023-09-14 12:37:14,504][75253] Port 40903 is available +[2023-09-14 12:37:14,504][75253] Using port 40903 +[2023-09-14 12:37:14,533][75215] Initialized w:1 v:2 player:0 +[2023-09-14 12:37:14,534][75215] Initialized w:1 v:2 player:1 +[2023-09-14 12:37:14,535][75219] Multi agent env, num agents: 2 +[2023-09-14 12:37:14,535][75215] 2 agent workers initialized for env 1! +[2023-09-14 12:37:14,542][75215] Decorrelating experience for 64 frames... +[2023-09-14 12:37:14,581][75219] Multi agent env, num agents: 2 +[2023-09-14 12:37:14,600][75216] Port 40303 is available +[2023-09-14 12:37:14,600][75216] Using port 40303 +[2023-09-14 12:37:14,613][75252] Initialized w:5 v:2 player:1 +[2023-09-14 12:37:14,614][75252] Initialized w:5 v:2 player:0 +[2023-09-14 12:37:14,614][75252] 2 agent workers initialized for env 5! +[2023-09-14 12:37:14,624][75252] Decorrelating experience for 64 frames... +[2023-09-14 12:37:14,626][75219] Port 40702 is available +[2023-09-14 12:37:14,626][75219] Using port 40702 +[2023-09-14 12:37:14,627][75219] Initializing env for player 0, init_info: {'port': 40702}... +[2023-09-14 12:37:14,628][75218] Port 40603 is available +[2023-09-14 12:37:14,629][75218] Using port 40603 +[2023-09-14 12:37:14,629][75218] Initializing env for player 0, init_info: {'port': 40603}... +[2023-09-14 12:37:14,658][75219] Using port 40702 on host... +[2023-09-14 12:37:14,659][75218] Using port 40603 on host... +[2023-09-14 12:37:14,679][75219] Initializing env for player 1, init_info: {'port': 40702}... +[2023-09-14 12:37:14,680][75218] Initializing env for player 1, init_info: {'port': 40603}... +[2023-09-14 12:37:14,712][75215] Port 40403 is available +[2023-09-14 12:37:14,712][75215] Using port 40403 +[2023-09-14 12:37:14,781][75252] Port 40803 is available +[2023-09-14 12:37:14,782][75252] Using port 40803 +[2023-09-14 12:37:14,782][75252] Initializing env for player 0, init_info: {'port': 40803}... +[2023-09-14 12:37:14,810][75252] Using port 40803 on host... +[2023-09-14 12:37:14,832][75252] Initializing env for player 1, init_info: {'port': 40803}... +[2023-09-14 12:37:15,373][75254] Initialized w:7 v:2 player:0 +[2023-09-14 12:37:15,374][75254] Initialized w:7 v:2 player:1 +[2023-09-14 12:37:15,375][75254] 2 agent workers initialized for env 7! +[2023-09-14 12:37:15,385][75254] Decorrelating experience for 64 frames... +[2023-09-14 12:37:15,414][75216] Initializing env for player 0, init_info: {'port': 40303}... +[2023-09-14 12:37:15,443][75216] Using port 40303 on host... +[2023-09-14 12:37:15,465][75216] Initializing env for player 1, init_info: {'port': 40303}... +[2023-09-14 12:37:15,474][75217] Initialized w:2 v:2 player:1 +[2023-09-14 12:37:15,475][75217] Initialized w:2 v:2 player:0 +[2023-09-14 12:37:15,477][75217] 2 agent workers initialized for env 2! +[2023-09-14 12:37:15,492][75217] Decorrelating experience for 64 frames... +[2023-09-14 12:37:15,515][75253] Initializing env for player 0, init_info: {'port': 40903}... +[2023-09-14 12:37:15,529][75254] Port 41003 is available +[2023-09-14 12:37:15,529][75254] Using port 41003 +[2023-09-14 12:37:15,529][75254] Initializing env for player 0, init_info: {'port': 41003}... +[2023-09-14 12:37:15,548][75253] Using port 40903 on host... +[2023-09-14 12:37:15,565][75253] Initializing env for player 1, init_info: {'port': 40903}... +[2023-09-14 12:37:15,567][75254] Using port 41003 on host... +[2023-09-14 12:37:15,580][75254] Initializing env for player 1, init_info: {'port': 41003}... +[2023-09-14 12:37:15,636][75217] Port 40503 is available +[2023-09-14 12:37:15,636][75217] Using port 40503 +[2023-09-14 12:37:15,636][75217] Initializing env for player 0, init_info: {'port': 40503}... +[2023-09-14 12:37:15,665][75217] Using port 40503 on host... +[2023-09-14 12:37:15,687][75217] Initializing env for player 1, init_info: {'port': 40503}... +[2023-09-14 12:37:15,710][75218] Initialized w:3 v:3 player:0 +[2023-09-14 12:37:15,711][75218] Initialized w:3 v:3 player:1 +[2023-09-14 12:37:15,712][75218] 2 agent workers initialized for env 3! +[2023-09-14 12:37:15,722][75218] Decorrelating experience for 96 frames... +[2023-09-14 12:37:15,837][75219] Initialized w:4 v:2 player:0 +[2023-09-14 12:37:15,837][75219] Initialized w:4 v:2 player:1 +[2023-09-14 12:37:15,839][75219] 2 agent workers initialized for env 4! +[2023-09-14 12:37:15,849][75219] Decorrelating experience for 64 frames... +[2023-09-14 12:37:15,855][75252] Initialized w:5 v:3 player:1 +[2023-09-14 12:37:15,856][75252] Initialized w:5 v:3 player:0 +[2023-09-14 12:37:15,857][75252] 2 agent workers initialized for env 5! +[2023-09-14 12:37:15,866][75252] Decorrelating experience for 96 frames... +[2023-09-14 12:37:15,873][75215] Initializing env for player 0, init_info: {'port': 40403}... +[2023-09-14 12:37:15,918][75215] Using port 40403 on host... +[2023-09-14 12:37:15,926][75215] Initializing env for player 1, init_info: {'port': 40403}... +[2023-09-14 12:37:15,983][75219] Port 40703 is available +[2023-09-14 12:37:15,983][75219] Using port 40703 +[2023-09-14 12:37:15,983][75219] Initializing env for player 0, init_info: {'port': 40703}... +[2023-09-14 12:37:16,013][75219] Using port 40703 on host... +[2023-09-14 12:37:16,034][75219] Initializing env for player 1, init_info: {'port': 40703}... +[2023-09-14 12:37:16,489][75216] Initialized w:0 v:3 player:1 +[2023-09-14 12:37:16,489][75216] Initialized w:0 v:3 player:0 +[2023-09-14 12:37:16,490][75216] 2 agent workers initialized for env 0! +[2023-09-14 12:37:16,498][75216] Decorrelating experience for 96 frames... +[2023-09-14 12:37:16,597][75253] Initialized w:6 v:3 player:1 +[2023-09-14 12:37:16,599][75253] Initialized w:6 v:3 player:0 +[2023-09-14 12:37:16,600][75253] 2 agent workers initialized for env 6! +[2023-09-14 12:37:16,614][75253] Decorrelating experience for 96 frames... +[2023-09-14 12:37:16,619][109198] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 6832128. Throughput: 0: 0.0, 1: 42.0. Samples: 210. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 12:37:16,671][75254] Initialized w:7 v:3 player:0 +[2023-09-14 12:37:16,672][75254] Initialized w:7 v:3 player:1 +[2023-09-14 12:37:16,673][75254] 2 agent workers initialized for env 7! +[2023-09-14 12:37:16,683][75254] Decorrelating experience for 96 frames... +[2023-09-14 12:37:16,710][75217] Initialized w:2 v:3 player:1 +[2023-09-14 12:37:16,711][75217] Initialized w:2 v:3 player:0 +[2023-09-14 12:37:16,712][75217] 2 agent workers initialized for env 2! +[2023-09-14 12:37:16,721][75217] Decorrelating experience for 96 frames... +[2023-09-14 12:37:17,079][75219] Initialized w:4 v:3 player:1 +[2023-09-14 12:37:17,080][75219] Initialized w:4 v:3 player:0 +[2023-09-14 12:37:17,082][75219] 2 agent workers initialized for env 4! +[2023-09-14 12:37:17,092][75219] Decorrelating experience for 96 frames... +[2023-09-14 12:37:17,098][75215] Initialized w:1 v:3 player:0 +[2023-09-14 12:37:17,099][75215] Initialized w:1 v:3 player:1 +[2023-09-14 12:37:17,100][75215] 2 agent workers initialized for env 1! +[2023-09-14 12:37:17,111][75215] Decorrelating experience for 96 frames... +[2023-09-14 12:37:18,407][74942] Signal inference workers to stop experience collection... +[2023-09-14 12:37:18,414][75209] InferenceWorker_p1-w0: stopping experience collection +[2023-09-14 12:37:18,418][75214] InferenceWorker_p0-w0: stopping experience collection +[2023-09-14 12:37:21,400][74942] Signal inference workers to resume experience collection... +[2023-09-14 12:37:21,401][75214] InferenceWorker_p0-w0: resuming experience collection +[2023-09-14 12:37:21,401][75209] InferenceWorker_p1-w0: resuming experience collection +[2023-09-14 12:37:21,619][109198] Fps is (10 sec: 409.6, 60 sec: 409.6, 300 sec: 409.6). Total num frames: 6836224. Throughput: 0: 276.8, 1: 204.4. Samples: 4812. Policy #0 lag: (min: 0.0, avg: 0.0, max: 0.0) +[2023-09-14 12:37:23,290][75052] Signal inference workers to stop experience collection... +[2023-09-14 12:37:23,730][109198] Heartbeat connected on Batcher_0 +[2023-09-14 12:37:23,734][109198] Heartbeat connected on LearnerWorker_p0 +[2023-09-14 12:37:23,739][109198] Heartbeat connected on Batcher_1 +[2023-09-14 12:37:23,748][109198] Heartbeat connected on InferenceWorker_p0-w0 +[2023-09-14 12:37:23,754][109198] Heartbeat connected on InferenceWorker_p1-w0 +[2023-09-14 12:37:23,760][109198] Heartbeat connected on RolloutWorker_w0 +[2023-09-14 12:37:23,764][109198] Heartbeat connected on RolloutWorker_w1 +[2023-09-14 12:37:23,768][75052] Signal inference workers to resume experience collection... +[2023-09-14 12:37:23,768][109198] Heartbeat connected on RolloutWorker_w2 +[2023-09-14 12:37:23,772][109198] Heartbeat connected on RolloutWorker_w3 +[2023-09-14 12:37:23,777][109198] Heartbeat connected on RolloutWorker_w4 +[2023-09-14 12:37:23,781][109198] Heartbeat connected on RolloutWorker_w5 +[2023-09-14 12:37:23,806][109198] Heartbeat connected on RolloutWorker_w6 +[2023-09-14 12:37:23,815][109198] Heartbeat connected on RolloutWorker_w7 +[2023-09-14 12:37:24,239][109198] Heartbeat connected on LearnerWorker_p1 +[2023-09-14 12:37:26,619][109198] Fps is (10 sec: 6144.1, 60 sec: 4096.0, 300 sec: 4096.0). Total num frames: 6893568. Throughput: 0: 562.1, 1: 390.4. Samples: 14288. Policy #0 lag: (min: 0.0, avg: 1.1, max: 3.0) +[2023-09-14 12:37:27,219][75214] Updated weights for policy 0, policy_version 1197 (0.0697) +[2023-09-14 12:37:29,320][75209] Updated weights for policy 1, policy_version 491 (0.0018) +[2023-09-14 12:37:31,619][109198] Fps is (10 sec: 12288.3, 60 sec: 6348.8, 300 sec: 6348.8). Total num frames: 6959104. Throughput: 0: 690.6, 1: 697.4. Samples: 27760. Policy #0 lag: (min: 0.0, avg: 0.9, max: 2.0) +[2023-09-14 12:37:32,425][75214] Updated weights for policy 0, policy_version 1207 (0.0012) +[2023-09-14 12:37:36,248][75209] Updated weights for policy 1, policy_version 501 (0.0012) +[2023-09-14 12:37:36,619][109198] Fps is (10 sec: 13516.9, 60 sec: 7864.3, 300 sec: 7864.3). Total num frames: 7028736. Throughput: 0: 1047.8, 1: 743.8. Samples: 44789. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:37:37,225][75214] Updated weights for policy 0, policy_version 1217 (0.0012) +[2023-09-14 12:37:41,619][109198] Fps is (10 sec: 14745.6, 60 sec: 9147.8, 300 sec: 9147.8). Total num frames: 7106560. Throughput: 0: 1297.6, 1: 918.7. Samples: 66489. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:37:42,111][75214] Updated weights for policy 0, policy_version 1227 (0.0013) +[2023-09-14 12:37:42,915][75209] Updated weights for policy 1, policy_version 511 (0.0013) +[2023-09-14 12:37:46,619][109198] Fps is (10 sec: 14745.6, 60 sec: 9830.4, 300 sec: 9830.4). Total num frames: 7176192. Throughput: 0: 1298.3, 1: 1051.7. Samples: 82250. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:37:46,871][75214] Updated weights for policy 0, policy_version 1237 (0.0012) +[2023-09-14 12:37:49,876][75209] Updated weights for policy 1, policy_version 521 (0.0011) +[2023-09-14 12:37:51,619][109198] Fps is (10 sec: 13926.2, 60 sec: 10342.4, 300 sec: 10342.4). Total num frames: 7245824. Throughput: 0: 1439.7, 1: 1022.9. Samples: 98505. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:37:51,894][75214] Updated weights for policy 0, policy_version 1247 (0.0015) +[2023-09-14 12:37:54,390][75253] DAMAGECOUNT value on done: 85.0 +[2023-09-14 12:37:54,391][75253] DAMAGECOUNT value on done: 105.0 +[2023-09-14 12:37:54,392][75253] Sum rewards: 5.616, reward structure: {'HEALTH': '-0.850', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.024', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.196', 'WEAPON3': '0.200', 'weapon2': '0.362', 'weapon3': '0.968', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon5': '2.436'} +[2023-09-14 12:37:54,701][75253] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:37:55,030][75253] DAMAGECOUNT value on done: 320.0 +[2023-09-14 12:37:55,030][75253] DAMAGECOUNT value on done: 355.0 +[2023-09-14 12:37:55,031][75253] Sum rewards: 5.033, reward structure: {'HEALTH': '-3.400', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.025', 'weapon5': '0.038', 'AMMO3': '0.103', 'weapon2': '0.110', 'AMMO4': '0.123', 'WEAPON4': '0.200', 'WEAPON5': '0.400', 'weapon4': '0.618', 'WEAPON3': '0.800', 'weapon3': '2.796', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.200'} +[2023-09-14 12:37:55,031][75253] Sum rewards: 5.421, reward structure: {'HEALTH': '-3.150', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.013', 'AMMO5': '0.015', 'AMMO4': '0.066', 'AMMO3': '0.066', 'weapon2': '0.152', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon4': '0.344', 'WEAPON3': '0.600', 'weapon5': '0.604', 'weapon3': '2.560', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.550'} +[2023-09-14 12:37:56,044][75215] DAMAGECOUNT value on done: 36.0 +[2023-09-14 12:37:56,044][75215] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:37:56,229][75215] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:37:56,475][75209] Updated weights for policy 1, policy_version 531 (0.0013) +[2023-09-14 12:37:56,619][109198] Fps is (10 sec: 14335.9, 60 sec: 10831.7, 300 sec: 10831.7). Total num frames: 7319552. Throughput: 0: 1559.4, 1: 1115.8. Samples: 120388. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:37:56,620][109198] Avg episode reward: [(0, '4.320')] +[2023-09-14 12:37:56,621][74942] Saving new best policy, reward=4.320! +[2023-09-14 12:37:56,637][75215] DAMAGECOUNT value on done: 230.0 +[2023-09-14 12:37:56,637][75215] DAMAGECOUNT value on done: 215.0 +[2023-09-14 12:37:56,638][75215] Sum rewards: 6.437, reward structure: {'HEALTH': '-1.500', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.008', 'AMMO5': '0.010', 'AMMO3': '0.039', 'AMMO4': '0.041', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.836', 'weapon5': '0.990', 'FRAGCOUNT': '2.000', 'weapon3': '2.112', 'DAMAGECOUNT': '2.300'} +[2023-09-14 12:37:56,638][75215] Sum rewards: 2.275, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'AMMO4': '-0.003', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.017', 'weapon4': '0.038', 'WEAPON4': '0.100', 'AMMO3': '0.108', 'WEAPON5': '0.400', 'weapon5': '0.444', 'weapon2': '0.748', 'WEAPON3': '0.800', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '2.150', 'weapon3': '2.474'} +[2023-09-14 12:37:56,750][75218] DAMAGECOUNT value on done: 65.0 +[2023-09-14 12:37:56,750][75218] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:37:56,926][75214] Updated weights for policy 0, policy_version 1257 (0.0013) +[2023-09-14 12:37:56,937][75218] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:37:57,274][75218] DAMAGECOUNT value on done: 100.0 +[2023-09-14 12:37:57,275][75218] DAMAGECOUNT value on done: 45.0 +[2023-09-14 12:37:57,275][75218] Sum rewards: 4.505, reward structure: {'HEALTH': '-0.450', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.020', 'AMMO4': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.270', 'weapon4': '0.576', 'weapon3': '0.668', 'weapon5': '0.896', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.000'} +[2023-09-14 12:37:57,276][75218] Sum rewards: 0.874, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO5': '0.005', 'AMMO4': '0.008', 'AMMO3': '0.070', 'weapon5': '0.098', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.450', 'weapon2': '0.454', 'weapon4': '0.552', 'WEAPON3': '0.600', 'weapon3': '2.336'} +[2023-09-14 12:37:57,703][75217] DAMAGECOUNT value on done: 212.0 +[2023-09-14 12:37:57,704][75217] DAMAGECOUNT value on done: 165.0 +[2023-09-14 12:37:57,705][75217] Sum rewards: 5.886, reward structure: {'HEALTH': '-1.600', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.007', 'weapon2': '0.044', 'AMMO3': '0.048', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.482', 'weapon5': '1.488', 'weapon3': '1.496', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.120'} +[2023-09-14 12:37:57,705][75217] Sum rewards: 0.386, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.024', 'AMMO3': '0.047', 'weapon5': '0.054', 'AMMO4': '0.119', 'weapon2': '0.176', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'WEAPON3': '0.400', 'weapon4': '0.766', 'FRAGCOUNT': '0.999', 'weapon3': '1.640', 'DAMAGECOUNT': '1.650'} +[2023-09-14 12:37:57,801][75219] DAMAGECOUNT value on done: 205.0 +[2023-09-14 12:37:57,801][75219] Sum rewards: 6.653, reward structure: {'HEALTH': '-0.100', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.370', 'FRAGCOUNT': '1.000', 'weapon3': '1.010', 'weapon5': '1.798', 'DAMAGECOUNT': '2.050'} +[2023-09-14 12:37:57,802][75219] DAMAGECOUNT value on done: 10.0 +[2023-09-14 12:37:57,877][75217] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:37:57,888][75218] DAMAGECOUNT value on done: 168.0 +[2023-09-14 12:37:57,888][75218] DAMAGECOUNT value on done: 215.0 +[2023-09-14 12:37:57,889][75218] Sum rewards: 2.902, reward structure: {'HEALTH': '-2.050', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'weapon5': '0.008', 'AMMO2': '0.015', 'weapon2': '0.050', 'AMMO3': '0.059', 'AMMO4': '0.076', 'WEAPON5': '0.100', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'weapon4': '0.978', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.680', 'weapon3': '2.180'} +[2023-09-14 12:37:57,889][75218] Sum rewards: 4.623, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.011', 'AMMO4': '0.053', 'AMMO3': '0.058', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon5': '0.336', 'weapon4': '0.412', 'WEAPON3': '0.500', 'weapon2': '0.658', 'FRAGCOUNT': '1.999', 'weapon3': '2.036', 'DAMAGECOUNT': '2.150'} +[2023-09-14 12:37:58,240][75217] DAMAGECOUNT value on done: 32.0 +[2023-09-14 12:37:58,240][75217] DAMAGECOUNT value on done: 10.0 +[2023-09-14 12:37:58,387][75219] DAMAGECOUNT value on done: 60.0 +[2023-09-14 12:37:58,387][75219] DAMAGECOUNT value on done: 213.0 +[2023-09-14 12:37:58,388][75219] Sum rewards: 6.148, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.040', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.224', 'WEAPON3': '0.400', 'weapon4': '0.450', 'weapon5': '0.470', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.130', 'weapon3': '2.226'} +[2023-09-14 12:37:58,419][75253] DAMAGECOUNT value on done: 130.0 +[2023-09-14 12:37:58,420][75253] DAMAGECOUNT value on done: 95.0 +[2023-09-14 12:37:58,420][75253] Sum rewards: 1.805, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.002', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.049', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.462', 'weapon4': '0.508', 'weapon2': '0.598', 'DAMAGECOUNT': '1.300', 'weapon3': '2.032'} +[2023-09-14 12:37:58,421][75253] Sum rewards: 2.915, reward structure: {'HEALTH': '-1.550', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.320', 'weapon2': '0.388', 'WEAPON3': '0.400', 'weapon5': '0.872', 'DAMAGECOUNT': '0.950', 'weapon3': '2.188'} +[2023-09-14 12:37:58,475][75218] DAMAGECOUNT value on done: 30.0 +[2023-09-14 12:37:58,475][75218] DAMAGECOUNT value on done: 100.0 +[2023-09-14 12:37:58,476][75218] Sum rewards: 5.986, reward structure: {'HEALTH': '-0.300', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'weapon2': '0.046', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.224', 'weapon3': '0.982', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon5': '2.610'} +[2023-09-14 12:37:58,504][75252] DAMAGECOUNT value on done: 173.0 +[2023-09-14 12:37:58,505][75252] Sum rewards: 3.111, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.027', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.033', 'weapon5': '0.064', 'WEAPON5': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.430', 'FRAGCOUNT': '1.000', 'weapon3': '1.378', 'DAMAGECOUNT': '1.730'} +[2023-09-14 12:37:58,505][75252] DAMAGECOUNT value on done: 105.0 +[2023-09-14 12:37:58,505][75252] Sum rewards: 2.757, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.018', 'AMMO3': '0.081', 'AMMO4': '0.087', 'WEAPON5': '0.200', 'weapon5': '0.298', 'WEAPON4': '0.300', 'weapon2': '0.304', 'WEAPON3': '0.600', 'weapon4': '0.952', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '1.858'} +[2023-09-14 12:37:58,594][75219] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:37:58,743][75252] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:37:58,841][75217] DAMAGECOUNT value on done: 121.0 +[2023-09-14 12:37:58,843][75217] Sum rewards: 4.644, reward structure: {'HEALTH': '-0.950', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.024', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon2': '0.152', 'WEAPON3': '0.200', 'weapon4': '0.262', 'weapon3': '0.854', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.210', 'weapon5': '1.664'} +[2023-09-14 12:37:58,844][75217] DAMAGECOUNT value on done: 95.0 +[2023-09-14 12:37:58,929][75219] DAMAGECOUNT value on done: 55.0 +[2023-09-14 12:37:58,930][75219] DAMAGECOUNT value on done: 295.0 +[2023-09-14 12:37:58,931][75219] Sum rewards: 7.326, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO4': '0.050', 'AMMO3': '0.052', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.512', 'weapon4': '0.522', 'weapon5': '1.090', 'weapon3': '1.436', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.950'} +[2023-09-14 12:37:59,093][75253] DAMAGECOUNT value on done: 12.0 +[2023-09-14 12:37:59,093][75253] DAMAGECOUNT value on done: 30.0 +[2023-09-14 12:37:59,094][75253] Sum rewards: 1.796, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.005', 'AMMO4': '0.024', 'AMMO3': '0.051', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.120', 'weapon4': '0.248', 'weapon2': '0.290', 'WEAPON3': '0.400', 'weapon5': '1.024', 'weapon3': '1.432'} +[2023-09-14 12:37:59,103][75252] DAMAGECOUNT value on done: 10.0 +[2023-09-14 12:37:59,103][75252] DAMAGECOUNT value on done: 12.0 +[2023-09-14 12:37:59,237][75216] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:37:59,238][75216] DAMAGECOUNT value on done: 110.0 +[2023-09-14 12:37:59,239][75216] Sum rewards: 6.223, reward structure: {'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.015', 'weapon2': '0.016', 'AMMO3': '0.020', 'AMMO4': '0.074', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.532', 'weapon3': '0.862', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon5': '2.200'} +[2023-09-14 12:37:59,493][75217] DAMAGECOUNT value on done: 30.0 +[2023-09-14 12:37:59,493][75217] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:37:59,519][75219] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:37:59,520][75219] DAMAGECOUNT value on done: 30.0 +[2023-09-14 12:37:59,521][75216] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:37:59,890][75252] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:37:59,891][75252] DAMAGECOUNT value on done: 15.0 +[2023-09-14 12:37:59,891][75252] Sum rewards: 1.939, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.004', 'AMMO2': '0.010', 'AMMO3': '0.049', 'AMMO4': '0.050', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon2': '0.216', 'WEAPON3': '0.400', 'weapon4': '0.596', 'weapon5': '0.980', 'weapon3': '1.334'} +[2023-09-14 12:37:59,935][75216] DAMAGECOUNT value on done: 208.0 +[2023-09-14 12:37:59,936][75216] Sum rewards: 3.081, reward structure: {'HEALTH': '-2.600', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.011', 'AMMO5': '0.012', 'AMMO4': '0.056', 'AMMO3': '0.072', 'WEAPON4': '0.200', 'weapon4': '0.294', 'WEAPON5': '0.300', 'weapon5': '0.408', 'weapon2': '0.410', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '2.080', 'weapon3': '2.236'} +[2023-09-14 12:37:59,936][75216] DAMAGECOUNT value on done: 260.0 +[2023-09-14 12:37:59,936][75216] Sum rewards: 6.828, reward structure: {'HEALTH': '-1.350', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.003', 'AMMO5': '0.010', 'AMMO4': '0.013', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.252', 'weapon2': '0.366', 'WEAPON3': '0.400', 'weapon5': '1.138', 'FRAGCOUNT': '2.000', 'weapon3': '2.056', 'DAMAGECOUNT': '2.600'} +[2023-09-14 12:38:00,236][75215] DAMAGECOUNT value on done: 105.0 +[2023-09-14 12:38:00,237][75215] DAMAGECOUNT value on done: 65.0 +[2023-09-14 12:38:00,237][75215] Sum rewards: 5.756, reward structure: {'HEALTH': '-0.650', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.019', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.344', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '1.092', 'weapon5': '2.626'} +[2023-09-14 12:38:00,238][75215] Sum rewards: -0.390, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.007', 'AMMO4': '0.034', 'AMMO3': '0.048', 'WEAPON5': '0.100', 'weapon4': '0.146', 'weapon5': '0.158', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.518', 'DAMAGECOUNT': '0.650', 'weapon3': '1.346'} +[2023-09-14 12:38:00,489][75252] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:38:00,489][75252] DAMAGECOUNT value on done: 64.0 +[2023-09-14 12:38:00,579][75216] DAMAGECOUNT value on done: 5.0 +[2023-09-14 12:38:00,579][75216] DAMAGECOUNT value on done: 50.0 +[2023-09-14 12:38:00,610][75254] DAMAGECOUNT value on done: 115.0 +[2023-09-14 12:38:00,610][75254] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:38:00,611][75254] Sum rewards: 4.088, reward structure: {'HEALTH': '-0.250', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.010', 'AMMO3': '0.020', 'AMMO4': '0.049', 'weapon2': '0.070', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.198', 'WEAPON3': '0.200', 'weapon4': '0.452', 'weapon3': '0.986', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150'} +[2023-09-14 12:38:00,823][75254] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:38:00,857][75215] DAMAGECOUNT value on done: 35.0 +[2023-09-14 12:38:00,857][75215] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:38:00,858][75215] Sum rewards: 2.594, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.009', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.692', 'weapon5': '1.436', 'weapon3': '1.878'} +[2023-09-14 12:38:01,398][75254] DAMAGECOUNT value on done: 20.0 +[2023-09-14 12:38:01,398][75254] DAMAGECOUNT value on done: 45.0 +[2023-09-14 12:38:01,399][75254] Sum rewards: 1.904, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.010', 'AMMO4': '0.050', 'AMMO3': '0.053', 'WEAPON5': '0.100', 'weapon2': '0.158', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.450', 'weapon4': '0.608', 'weapon5': '0.774', 'weapon3': '1.098'} +[2023-09-14 12:38:01,430][75216] DAMAGECOUNT value on done: 130.0 +[2023-09-14 12:38:01,431][75216] Sum rewards: 3.852, reward structure: {'HEALTH': '-0.450', 'HITCOUNT': '0.000', 'AMMO2': '0.010', 'AMMO3': '0.020', 'AMMO4': '0.050', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.306', 'weapon4': '0.394', 'weapon3': '0.922', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.300'} +[2023-09-14 12:38:01,430][75216] DAMAGECOUNT value on done: 45.0 +[2023-09-14 12:38:01,619][109198] Fps is (10 sec: 13926.4, 60 sec: 11059.2, 300 sec: 11059.2). Total num frames: 7385088. Throughput: 0: 1676.3, 1: 1333.4. Samples: 135650. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:38:01,620][109198] Avg episode reward: [(0, '3.747'), (1, '2.728')] +[2023-09-14 12:38:02,130][75254] DAMAGECOUNT value on done: 15.0 +[2023-09-14 12:38:02,130][75254] DAMAGECOUNT value on done: 280.0 +[2023-09-14 12:38:02,131][75254] Sum rewards: 7.995, reward structure: {'HEALTH': '-0.150', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'weapon4': '0.098', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.350', 'weapon3': '1.028', 'weapon5': '1.446', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.800'} +[2023-09-14 12:38:02,358][75209] Updated weights for policy 1, policy_version 541 (0.0012) +[2023-09-14 12:38:02,754][75254] DAMAGECOUNT value on done: 205.0 +[2023-09-14 12:38:02,754][75254] DAMAGECOUNT value on done: 155.0 +[2023-09-14 12:38:02,755][75254] Sum rewards: 6.024, reward structure: {'HEALTH': '-1.550', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.328', 'weapon2': '0.360', 'WEAPON3': '0.400', 'weapon5': '1.140', 'weapon3': '1.948', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050'} +[2023-09-14 12:38:02,755][75254] Sum rewards: 2.768, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO4': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.059', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.278', 'WEAPON3': '0.500', 'weapon2': '0.510', 'weapon4': '0.566', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.550', 'weapon3': '1.894'} +[2023-09-14 12:38:03,003][75214] Updated weights for policy 0, policy_version 1267 (0.0012) +[2023-09-14 12:38:06,619][109198] Fps is (10 sec: 14336.0, 60 sec: 11468.8, 300 sec: 11468.8). Total num frames: 7462912. Throughput: 0: 1829.0, 1: 1419.1. Samples: 150977. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:38:06,620][109198] Avg episode reward: [(0, '3.919'), (1, '2.659')] +[2023-09-14 12:38:07,616][75209] Updated weights for policy 1, policy_version 551 (0.0012) +[2023-09-14 12:38:08,797][75214] Updated weights for policy 0, policy_version 1277 (0.0013) +[2023-09-14 12:38:11,619][109198] Fps is (10 sec: 14745.6, 60 sec: 11673.6, 300 sec: 11673.6). Total num frames: 7532544. Throughput: 0: 1933.9, 1: 1591.6. Samples: 172937. Policy #0 lag: (min: 0.0, avg: 0.3, max: 2.0) +[2023-09-14 12:38:11,620][109198] Avg episode reward: [(0, '3.919'), (1, '2.659')] +[2023-09-14 12:38:13,083][75209] Updated weights for policy 1, policy_version 561 (0.0012) +[2023-09-14 12:38:14,833][75214] Updated weights for policy 0, policy_version 1287 (0.0012) +[2023-09-14 12:38:16,619][109198] Fps is (10 sec: 14745.7, 60 sec: 12970.7, 300 sec: 11972.9). Total num frames: 7610368. Throughput: 0: 1931.3, 1: 1670.5. Samples: 189839. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:38:16,620][109198] Avg episode reward: [(0, '3.919'), (1, '2.659')] +[2023-09-14 12:38:18,054][75209] Updated weights for policy 1, policy_version 571 (0.0012) +[2023-09-14 12:38:20,511][75214] Updated weights for policy 0, policy_version 1297 (0.0014) +[2023-09-14 12:38:21,619][109198] Fps is (10 sec: 14745.6, 60 sec: 14063.0, 300 sec: 12112.5). Total num frames: 7680000. Throughput: 0: 1891.8, 1: 1701.3. Samples: 206476. Policy #0 lag: (min: 0.0, avg: 0.4, max: 2.0) +[2023-09-14 12:38:21,620][109198] Avg episode reward: [(0, '3.919'), (1, '2.659')] +[2023-09-14 12:38:23,325][75209] Updated weights for policy 1, policy_version 581 (0.0013) +[2023-09-14 12:38:26,471][75214] Updated weights for policy 0, policy_version 1307 (0.0013) +[2023-09-14 12:38:26,619][109198] Fps is (10 sec: 14745.6, 60 sec: 14404.3, 300 sec: 12342.6). Total num frames: 7757824. Throughput: 0: 1836.8, 1: 1755.5. Samples: 228146. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:38:26,620][109198] Avg episode reward: [(0, '3.919'), (1, '2.659')] +[2023-09-14 12:38:28,710][75209] Updated weights for policy 1, policy_version 591 (0.0015) +[2023-09-14 12:38:30,318][75219] DAMAGECOUNT value on done: 405.0 +[2023-09-14 12:38:30,318][75219] DAMAGECOUNT value on done: 385.0 +[2023-09-14 12:38:30,319][75219] Sum rewards: 3.032, reward structure: {'HEALTH': '-3.650', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'weapon5': '0.028', 'weapon2': '0.038', 'AMMO2': '0.043', 'AMMO3': '0.099', 'AMMO4': '0.215', 'WEAPON4': '0.300', 'weapon4': '0.386', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'DAMAGECOUNT': '2.000', 'FRAGCOUNT': '2.000', 'weapon3': '3.352'} +[2023-09-14 12:38:30,319][75219] Sum rewards: 7.420, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.017', 'AMMO3': '0.057', 'AMMO4': '0.084', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.248', 'weapon2': '0.414', 'WEAPON3': '0.500', 'weapon5': '0.530', 'weapon3': '2.410', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.750'} +[2023-09-14 12:38:30,844][75219] DAMAGECOUNT value on done: 380.0 +[2023-09-14 12:38:30,845][75219] Sum rewards: 6.972, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.003', 'AMMO5': '0.010', 'AMMO4': '0.015', 'AMMO3': '0.056', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.298', 'weapon2': '0.476', 'WEAPON3': '0.500', 'weapon5': '0.734', 'weapon3': '2.280', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.200'} +[2023-09-14 12:38:30,844][75219] DAMAGECOUNT value on done: 413.0 +[2023-09-14 12:38:30,845][75219] Sum rewards: 2.875, reward structure: {'HEALTH': '-3.200', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.012', 'AMMO4': '0.024', 'weapon2': '0.034', 'AMMO3': '0.107', 'weapon5': '0.146', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.544', 'WEAPON3': '0.800', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.000', 'weapon3': '2.902'} +[2023-09-14 12:38:31,619][109198] Fps is (10 sec: 14745.7, 60 sec: 14472.5, 300 sec: 12441.6). Total num frames: 7827456. Throughput: 0: 1809.3, 1: 1804.6. Samples: 244875. Policy #0 lag: (min: 0.0, avg: 0.3, max: 2.0) +[2023-09-14 12:38:31,620][109198] Avg episode reward: [(0, '4.032'), (1, '2.659')] +[2023-09-14 12:38:31,716][75253] DAMAGECOUNT value on done: 150.0 +[2023-09-14 12:38:31,717][75253] DAMAGECOUNT value on done: 245.0 +[2023-09-14 12:38:31,718][75253] Sum rewards: 3.961, reward structure: {'HEALTH': '-0.630', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.010', 'AMMO3': '0.020', 'AMMO4': '0.050', 'weapon5': '0.056', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.242', 'weapon4': '0.374', 'weapon3': '0.836', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.600'} +[2023-09-14 12:38:32,324][75253] DAMAGECOUNT value on done: 365.0 +[2023-09-14 12:38:32,325][75253] DAMAGECOUNT value on done: 430.0 +[2023-09-14 12:38:32,325][75253] Sum rewards: 4.670, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.009', 'AMMO4': '0.025', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.416', 'weapon2': '0.492', 'weapon5': '0.962', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.100', 'weapon3': '1.922'} +[2023-09-14 12:38:32,764][75214] Updated weights for policy 0, policy_version 1317 (0.0013) +[2023-09-14 12:38:33,567][75218] DAMAGECOUNT value on done: 30.0 +[2023-09-14 12:38:33,567][75218] DAMAGECOUNT value on done: 65.0 +[2023-09-14 12:38:33,568][75218] Sum rewards: 2.507, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.021', 'AMMO3': '0.042', 'AMMO4': '0.104', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.300', 'weapon5': '0.308', 'weapon4': '0.358', 'WEAPON3': '0.400', 'weapon2': '0.454', 'weapon3': '2.112'} +[2023-09-14 12:38:33,582][75216] Large shaping reward 2.942 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 2.0), ('DAMAGECOUNT', 1.94, 194.0), ('weapon5', 0.002)] +[2023-09-14 12:38:34,152][75218] DAMAGECOUNT value on done: 345.0 +[2023-09-14 12:38:34,152][75218] DAMAGECOUNT value on done: 350.0 +[2023-09-14 12:38:34,153][75218] Sum rewards: 3.818, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.015', 'AMMO4': '0.075', 'weapon5': '0.090', 'AMMO3': '0.105', 'WEAPON4': '0.200', 'weapon4': '0.228', 'WEAPON5': '0.300', 'weapon2': '0.444', 'WEAPON3': '0.800', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.450', 'weapon3': '3.096'} +[2023-09-14 12:38:34,153][75218] Sum rewards: 6.422, reward structure: {'HEALTH': '-2.400', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'weapon2': '0.004', 'AMMO5': '0.010', 'AMMO2': '0.018', 'AMMO3': '0.052', 'AMMO4': '0.090', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon5': '0.410', 'WEAPON3': '0.500', 'weapon4': '0.566', 'weapon3': '2.622', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.050'} +[2023-09-14 12:38:34,225][75209] Updated weights for policy 1, policy_version 601 (0.0016) +[2023-09-14 12:38:34,361][75215] DAMAGECOUNT value on done: 105.0 +[2023-09-14 12:38:34,361][75215] DAMAGECOUNT value on done: 146.0 +[2023-09-14 12:38:34,361][75215] Sum rewards: 2.843, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.006', 'AMMO5': '0.014', 'AMMO4': '0.028', 'AMMO3': '0.085', 'weapon2': '0.282', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon4': '0.584', 'WEAPON3': '0.600', 'weapon5': '0.636', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '1.958'} +[2023-09-14 12:38:34,362][75215] Sum rewards: 4.650, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.714', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon5': '1.292', 'weapon3': '2.004'} +[2023-09-14 12:38:34,760][75218] DAMAGECOUNT value on done: 215.0 +[2023-09-14 12:38:34,760][75218] DAMAGECOUNT value on done: 233.0 +[2023-09-14 12:38:34,761][75218] Sum rewards: 2.931, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.015', 'AMMO3': '0.040', 'AMMO4': '0.076', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.282', 'weapon5': '0.318', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.650', 'weapon4': '0.704', 'weapon3': '2.038'} +[2023-09-14 12:38:34,908][75215] DAMAGECOUNT value on done: 260.0 +[2023-09-14 12:38:34,909][75215] DAMAGECOUNT value on done: 312.0 +[2023-09-14 12:38:34,909][75215] Sum rewards: 2.972, reward structure: {'HEALTH': '-1.300', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.022', 'AMMO3': '0.051', 'AMMO4': '0.109', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon2': '0.204', 'weapon4': '0.330', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.970', 'weapon5': '1.310', 'weapon3': '1.468'} +[2023-09-14 12:38:35,333][75218] DAMAGECOUNT value on done: 100.0 +[2023-09-14 12:38:35,333][75218] DAMAGECOUNT value on done: 197.0 +[2023-09-14 12:38:35,334][75218] Sum rewards: 2.955, reward structure: {'HEALTH': '-1.420', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.314', 'weapon2': '0.346', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.700', 'weapon5': '1.178', 'weapon3': '2.090'} +[2023-09-14 12:38:35,467][75219] DAMAGECOUNT value on done: 256.0 +[2023-09-14 12:38:35,467][75219] DAMAGECOUNT value on done: 500.0 +[2023-09-14 12:38:35,468][75219] Sum rewards: 2.326, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.015', 'AMMO3': '0.034', 'AMMO4': '0.074', 'WEAPON5': '0.100', 'weapon5': '0.170', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.420', 'weapon4': '0.670', 'FRAGCOUNT': '1.000', 'weapon3': '1.330', 'DAMAGECOUNT': '2.010'} +[2023-09-14 12:38:35,468][75219] Sum rewards: 5.543, reward structure: {'HEALTH': '-1.780', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.008', 'AMMO4': '0.040', 'AMMO3': '0.040', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon2': '0.350', 'WEAPON3': '0.400', 'weapon4': '0.424', 'weapon5': '0.646', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050', 'weapon3': '2.060'} +[2023-09-14 12:38:35,526][75217] DAMAGECOUNT value on done: 317.0 +[2023-09-14 12:38:35,527][75217] DAMAGECOUNT value on done: 237.0 +[2023-09-14 12:38:35,527][75217] Sum rewards: 4.308, reward structure: {'HEALTH': '-1.020', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.015', 'AMMO3': '0.040', 'AMMO4': '0.075', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.534', 'weapon5': '0.564', 'weapon4': '0.606', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '1.740'} +[2023-09-14 12:38:35,720][75253] DAMAGECOUNT value on done: 185.0 +[2023-09-14 12:38:35,721][75253] DAMAGECOUNT value on done: 110.0 +[2023-09-14 12:38:35,721][75253] Sum rewards: 2.541, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.150', 'WEAPON3': '0.200', 'weapon2': '0.706', 'weapon3': '0.888', 'weapon5': '2.474'} +[2023-09-14 12:38:35,995][75219] DAMAGECOUNT value on done: 353.0 +[2023-09-14 12:38:35,995][75219] DAMAGECOUNT value on done: 140.0 +[2023-09-14 12:38:35,996][75219] Sum rewards: 6.954, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'weapon2': '0.002', 'AMMO5': '0.007', 'AMMO2': '0.015', 'AMMO3': '0.040', 'AMMO4': '0.073', 'weapon5': '0.186', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.404', 'weapon3': '1.996', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '3.530'} +[2023-09-14 12:38:35,996][75219] Sum rewards: 2.196, reward structure: {'HEALTH': '-2.680', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.014', 'AMMO5': '0.015', 'AMMO4': '0.071', 'AMMO3': '0.075', 'weapon2': '0.108', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon5': '0.504', 'WEAPON3': '0.600', 'weapon4': '0.728', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon3': '2.160'} +[2023-09-14 12:38:36,101][75217] DAMAGECOUNT value on done: 132.0 +[2023-09-14 12:38:36,101][75217] DAMAGECOUNT value on done: 120.0 +[2023-09-14 12:38:36,102][75217] Sum rewards: 2.674, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO2': '0.017', 'AMMO3': '0.080', 'AMMO4': '0.084', 'weapon5': '0.148', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon2': '0.348', 'WEAPON3': '0.600', 'weapon4': '0.906', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon3': '1.878'} +[2023-09-14 12:38:36,102][75217] Sum rewards: 4.655, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.298', 'FRAGCOUNT': '1.000', 'weapon3': '1.092', 'DAMAGECOUNT': '1.100', 'weapon5': '2.710'} +[2023-09-14 12:38:36,239][75252] DAMAGECOUNT value on done: 417.0 +[2023-09-14 12:38:36,239][75252] DAMAGECOUNT value on done: 390.0 +[2023-09-14 12:38:36,240][75252] Sum rewards: 4.150, reward structure: {'HEALTH': '-2.800', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'weapon2': '0.002', 'AMMO5': '0.012', 'AMMO2': '0.013', 'AMMO4': '0.067', 'AMMO3': '0.073', 'WEAPON4': '0.200', 'weapon5': '0.290', 'WEAPON5': '0.300', 'weapon4': '0.390', 'WEAPON3': '0.600', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.440', 'weapon3': '2.562'} +[2023-09-14 12:38:36,240][75252] Sum rewards: 5.150, reward structure: {'HEALTH': '-2.290', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.001', 'AMMO4': '0.004', 'AMMO5': '0.010', 'AMMO3': '0.077', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.288', 'weapon2': '0.410', 'weapon5': '0.522', 'WEAPON3': '0.600', 'FRAGCOUNT': '2.000', 'weapon3': '2.378', 'DAMAGECOUNT': '2.850'} +[2023-09-14 12:38:36,332][75253] DAMAGECOUNT value on done: 172.0 +[2023-09-14 12:38:36,332][75253] DAMAGECOUNT value on done: 75.0 +[2023-09-14 12:38:36,333][75253] Sum rewards: 3.105, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.015', 'AMMO3': '0.040', 'AMMO4': '0.075', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.206', 'WEAPON3': '0.400', 'weapon5': '0.580', 'weapon4': '0.712', 'FRAGCOUNT': '0.998', 'DAMAGECOUNT': '1.600', 'weapon3': '2.072'} +[2023-09-14 12:38:36,500][75217] DAMAGECOUNT value on done: 186.0 +[2023-09-14 12:38:36,500][75217] DAMAGECOUNT value on done: 163.0 +[2023-09-14 12:38:36,501][75217] Sum rewards: 2.675, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.015', 'AMMO3': '0.048', 'AMMO4': '0.074', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.490', 'weapon4': '0.548', 'DAMAGECOUNT': '0.650', 'weapon2': '0.760', 'weapon3': '1.436'} +[2023-09-14 12:38:36,501][75217] Sum rewards: 2.276, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.008', 'AMMO3': '0.036', 'AMMO4': '0.038', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.300', 'weapon4': '0.360', 'weapon2': '0.408', 'DAMAGECOUNT': '0.680', 'weapon3': '1.040', 'weapon5': '1.202'} +[2023-09-14 12:38:36,619][109198] Fps is (10 sec: 13926.3, 60 sec: 14472.5, 300 sec: 12528.9). Total num frames: 7897088. Throughput: 0: 1744.4, 1: 1836.4. Samples: 259640. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:38:36,620][109198] Avg episode reward: [(0, '4.024'), (1, '2.752')] +[2023-09-14 12:38:36,718][75252] DAMAGECOUNT value on done: 40.0 +[2023-09-14 12:38:36,718][75252] DAMAGECOUNT value on done: 78.0 +[2023-09-14 12:38:37,064][75217] DAMAGECOUNT value on done: 218.0 +[2023-09-14 12:38:37,065][75217] DAMAGECOUNT value on done: 70.0 +[2023-09-14 12:38:37,065][75217] Sum rewards: 4.290, reward structure: {'HEALTH': '-0.700', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.020', 'AMMO3': '0.020', 'weapon2': '0.048', 'AMMO4': '0.099', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.148', 'WEAPON3': '0.200', 'weapon4': '0.616', 'weapon3': '0.754', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.880'} +[2023-09-14 12:38:37,341][75252] DAMAGECOUNT value on done: 5.0 +[2023-09-14 12:38:37,341][75252] DAMAGECOUNT value on done: 65.0 +[2023-09-14 12:38:38,011][75252] DAMAGECOUNT value on done: 169.0 +[2023-09-14 12:38:38,011][75252] DAMAGECOUNT value on done: 104.0 +[2023-09-14 12:38:38,012][75252] Sum rewards: 4.528, reward structure: {'HEALTH': '-1.250', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.010', 'weapon2': '0.036', 'AMMO3': '0.040', 'AMMO4': '0.049', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.560', 'weapon4': '0.648', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.690', 'weapon3': '1.938'} +[2023-09-14 12:38:38,212][75216] DAMAGECOUNT value on done: 371.0 +[2023-09-14 12:38:38,212][75216] DAMAGECOUNT value on done: 165.0 +[2023-09-14 12:38:38,213][75216] Sum rewards: 3.386, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.022', 'AMMO3': '0.059', 'AMMO4': '0.107', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon2': '0.362', 'WEAPON3': '0.500', 'weapon4': '0.548', 'weapon5': '0.580', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.650', 'weapon3': '2.050'} +[2023-09-14 12:38:38,382][75215] DAMAGECOUNT value on done: 70.0 +[2023-09-14 12:38:38,382][75215] DAMAGECOUNT value on done: 190.0 +[2023-09-14 12:38:38,383][75215] Sum rewards: 2.399, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.004', 'FRAGCOUNT': '-0.001', 'AMMO2': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.188', 'weapon2': '0.194', 'WEAPON3': '0.400', 'weapon5': '0.444', 'DAMAGECOUNT': '0.850', 'weapon3': '2.084'} +[2023-09-14 12:38:38,952][75216] DAMAGECOUNT value on done: 421.0 +[2023-09-14 12:38:38,952][75216] DAMAGECOUNT value on done: 370.0 +[2023-09-14 12:38:38,952][75216] Sum rewards: 5.509, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.010', 'AMMO3': '0.042', 'AMMO4': '0.050', 'weapon5': '0.052', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon2': '0.254', 'WEAPON3': '0.400', 'weapon4': '0.654', 'weapon3': '1.714', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.130'} +[2023-09-14 12:38:38,953][75216] Sum rewards: 2.499, reward structure: {'HEALTH': '-2.100', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.003', 'AMMO5': '0.005', 'AMMO4': '0.014', 'AMMO3': '0.067', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.180', 'weapon2': '0.272', 'weapon4': '0.358', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon3': '2.800'} +[2023-09-14 12:38:38,955][75215] DAMAGECOUNT value on done: 125.0 +[2023-09-14 12:38:38,956][75215] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:38:38,956][75215] Sum rewards: 2.379, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO5': '0.003', 'AMMO4': '0.011', 'AMMO3': '0.032', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON6': '0.200', 'weapon6': '0.208', 'weapon4': '0.282', 'WEAPON3': '0.300', 'weapon5': '0.324', 'weapon2': '0.496', 'DAMAGECOUNT': '0.900', 'weapon3': '1.222'} +[2023-09-14 12:38:38,957][75215] Sum rewards: 1.090, reward structure: {'HEALTH': '-1.700', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO2': '0.008', 'AMMO5': '0.009', 'AMMO4': '0.038', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.274', 'WEAPON3': '0.400', 'weapon4': '0.412', 'weapon2': '0.466', 'weapon3': '1.844'} +[2023-09-14 12:38:39,080][75214] Updated weights for policy 0, policy_version 1327 (0.0013) +[2023-09-14 12:38:39,511][75209] Updated weights for policy 1, policy_version 611 (0.0012) +[2023-09-14 12:38:39,659][75216] DAMAGECOUNT value on done: 70.0 +[2023-09-14 12:38:39,659][75216] DAMAGECOUNT value on done: 25.0 +[2023-09-14 12:38:39,660][75216] Sum rewards: 2.726, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.746', 'weapon5': '1.086', 'weapon3': '2.106'} +[2023-09-14 12:38:39,708][75254] DAMAGECOUNT value on done: 123.0 +[2023-09-14 12:38:39,709][75254] DAMAGECOUNT value on done: 36.0 +[2023-09-14 12:38:40,157][75216] DAMAGECOUNT value on done: 339.0 +[2023-09-14 12:38:40,157][75216] DAMAGECOUNT value on done: 70.0 +[2023-09-14 12:38:40,157][75216] Sum rewards: 5.200, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.013', 'AMMO3': '0.052', 'AMMO4': '0.065', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon2': '0.212', 'WEAPON3': '0.400', 'weapon4': '0.506', 'FRAGCOUNT': '0.999', 'weapon5': '1.300', 'weapon3': '1.358', 'DAMAGECOUNT': '2.090'} +[2023-09-14 12:38:40,290][75254] DAMAGECOUNT value on done: 320.0 +[2023-09-14 12:38:40,291][75254] DAMAGECOUNT value on done: 440.0 +[2023-09-14 12:38:40,291][75254] Sum rewards: 4.346, reward structure: {'HEALTH': '-3.850', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.015', 'weapon5': '0.016', 'AMMO5': '0.020', 'AMMO4': '0.075', 'AMMO3': '0.079', 'weapon2': '0.120', 'WEAPON4': '0.200', 'weapon4': '0.384', 'WEAPON5': '0.400', 'WEAPON3': '0.700', 'DAMAGECOUNT': '3.000', 'FRAGCOUNT': '3.000', 'weapon3': '3.186'} +[2023-09-14 12:38:40,292][75254] Sum rewards: 6.381, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.027', 'weapon2': '0.040', 'AMMO3': '0.100', 'AMMO4': '0.137', 'WEAPON4': '0.300', 'weapon4': '0.302', 'WEAPON5': '0.400', 'WEAPON3': '0.700', 'weapon5': '1.058', 'weapon3': '2.346', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.950'} +[2023-09-14 12:38:40,839][75254] DAMAGECOUNT value on done: 345.0 +[2023-09-14 12:38:40,840][75254] DAMAGECOUNT value on done: 15.0 +[2023-09-14 12:38:41,427][75254] DAMAGECOUNT value on done: 205.0 +[2023-09-14 12:38:41,427][75254] DAMAGECOUNT value on done: 160.0 +[2023-09-14 12:38:41,619][109198] Fps is (10 sec: 14336.0, 60 sec: 14404.2, 300 sec: 12652.1). Total num frames: 7970816. Throughput: 0: 1689.9, 1: 1881.1. Samples: 281083. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:38:41,620][109198] Avg episode reward: [(0, '3.949'), (1, '2.782')] +[2023-09-14 12:38:44,805][75214] Updated weights for policy 0, policy_version 1337 (0.0013) +[2023-09-14 12:38:45,045][75209] Updated weights for policy 1, policy_version 621 (0.0012) +[2023-09-14 12:38:46,619][109198] Fps is (10 sec: 14336.0, 60 sec: 14404.3, 300 sec: 12719.2). Total num frames: 8040448. Throughput: 0: 1692.0, 1: 1896.6. Samples: 297136. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:38:46,620][109198] Avg episode reward: [(0, '3.949'), (1, '2.782')] +[2023-09-14 12:38:50,394][75214] Updated weights for policy 0, policy_version 1347 (0.0013) +[2023-09-14 12:38:50,833][75209] Updated weights for policy 1, policy_version 631 (0.0014) +[2023-09-14 12:38:51,619][109198] Fps is (10 sec: 14336.0, 60 sec: 14472.5, 300 sec: 12820.5). Total num frames: 8114176. Throughput: 0: 1716.8, 1: 1888.5. Samples: 313219. Policy #0 lag: (min: 0.0, avg: 0.7, max: 1.0) +[2023-09-14 12:38:51,620][109198] Avg episode reward: [(0, '3.949'), (1, '2.782')] +[2023-09-14 12:38:55,270][75218] Large shaping reward 2.562 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 2.0), ('DAMAGECOUNT', 1.56, 156.0), ('weapon5', 0.002)] +[2023-09-14 12:38:55,789][75214] Updated weights for policy 0, policy_version 1357 (0.0012) +[2023-09-14 12:38:56,294][75209] Updated weights for policy 1, policy_version 641 (0.0013) +[2023-09-14 12:38:56,619][109198] Fps is (10 sec: 14745.7, 60 sec: 14472.5, 300 sec: 12912.2). Total num frames: 8187904. Throughput: 0: 1741.2, 1: 1883.5. Samples: 336048. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:38:56,620][109198] Avg episode reward: [(0, '3.949'), (1, '2.782')] +[2023-09-14 12:39:00,989][75214] Updated weights for policy 0, policy_version 1367 (0.0011) +[2023-09-14 12:39:01,560][75209] Updated weights for policy 1, policy_version 651 (0.0011) +[2023-09-14 12:39:01,619][109198] Fps is (10 sec: 15564.9, 60 sec: 14745.6, 300 sec: 13070.0). Total num frames: 8269824. Throughput: 0: 1752.4, 1: 1881.6. Samples: 353371. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:39:01,620][109198] Avg episode reward: [(0, '3.949'), (1, '2.782')] +[2023-09-14 12:39:01,624][75052] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000651_2666496.pth... +[2023-09-14 12:39:01,624][74942] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001368_5603328.pth... +[2023-09-14 12:39:01,688][74942] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001054_4317184.pth +[2023-09-14 12:39:01,688][75052] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000341_1396736.pth +[2023-09-14 12:39:05,101][75254] Large shaping reward 2.602 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 1.0), ('DAMAGECOUNT', 1.6, 160.0), ('weapon5', 0.002)] +[2023-09-14 12:39:06,278][75219] DAMAGECOUNT value on done: 725.0 +[2023-09-14 12:39:06,278][75219] DAMAGECOUNT value on done: 685.0 +[2023-09-14 12:39:06,279][75219] Sum rewards: 5.596, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.030', 'weapon2': '0.076', 'AMMO3': '0.123', 'AMMO4': '0.149', 'WEAPON4': '0.300', 'WEAPON5': '0.400', 'weapon4': '0.452', 'weapon5': '0.758', 'WEAPON3': '0.800', 'weapon3': '2.288', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.200'} +[2023-09-14 12:39:06,279][75219] Sum rewards: 5.183, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.019', 'weapon5': '0.020', 'weapon2': '0.052', 'AMMO3': '0.088', 'AMMO4': '0.093', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon4': '0.336', 'WEAPON3': '0.700', 'DAMAGECOUNT': '3.000', 'FRAGCOUNT': '3.000', 'weapon3': '3.260'} +[2023-09-14 12:39:06,400][75214] Updated weights for policy 0, policy_version 1377 (0.0012) +[2023-09-14 12:39:06,619][109198] Fps is (10 sec: 15564.8, 60 sec: 14677.4, 300 sec: 13142.8). Total num frames: 8343552. Throughput: 0: 1774.1, 1: 1875.1. Samples: 370689. Policy #0 lag: (min: 0.0, avg: 0.8, max: 3.0) +[2023-09-14 12:39:06,620][109198] Avg episode reward: [(0, '3.990'), (1, '2.782')] +[2023-09-14 12:39:06,784][75219] DAMAGECOUNT value on done: 555.0 +[2023-09-14 12:39:06,784][75219] DAMAGECOUNT value on done: 448.0 +[2023-09-14 12:39:06,784][75219] Sum rewards: 5.202, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.018', 'AMMO3': '0.040', 'AMMO4': '0.092', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.412', 'weapon4': '0.518', 'weapon2': '0.608', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.750', 'weapon3': '1.956'} +[2023-09-14 12:39:06,907][75209] Updated weights for policy 1, policy_version 661 (0.0012) +[2023-09-14 12:39:07,921][75253] DAMAGECOUNT value on done: 360.0 +[2023-09-14 12:39:07,922][75253] DAMAGECOUNT value on done: 181.0 +[2023-09-14 12:39:07,922][75253] Sum rewards: 3.926, reward structure: {'HEALTH': '-0.310', 'HITCOUNT': '0.000', 'AMMO2': '0.010', 'AMMO3': '0.019', 'AMMO4': '0.050', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.296', 'weapon2': '0.448', 'weapon3': '0.962', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150'} +[2023-09-14 12:39:08,410][75253] DAMAGECOUNT value on done: 565.0 +[2023-09-14 12:39:08,410][75253] DAMAGECOUNT value on done: 569.0 +[2023-09-14 12:39:08,411][75253] Sum rewards: 3.676, reward structure: {'HEALTH': '-1.650', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO4': '0.002', 'AMMO5': '0.007', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'weapon5': '0.286', 'WEAPON3': '0.400', 'weapon2': '0.876', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.390', 'weapon3': '2.124'} +[2023-09-14 12:39:09,096][75215] DAMAGECOUNT value on done: 301.0 +[2023-09-14 12:39:09,097][75215] DAMAGECOUNT value on done: 130.0 +[2023-09-14 12:39:09,097][75215] Sum rewards: 6.629, reward structure: {'HEALTH': '-0.250', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.716', 'FRAGCOUNT': '1.000', 'weapon3': '1.032', 'DAMAGECOUNT': '1.550', 'weapon5': '2.256'} +[2023-09-14 12:39:09,098][75215] Sum rewards: 0.688, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.010', 'AMMO4': '0.048', 'AMMO3': '0.048', 'weapon2': '0.054', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.250', 'weapon4': '0.342', 'WEAPON3': '0.400', 'weapon5': '1.368', 'weapon3': '1.860'} +[2023-09-14 12:39:09,441][75218] DAMAGECOUNT value on done: 125.0 +[2023-09-14 12:39:09,442][75218] DAMAGECOUNT value on done: 322.0 +[2023-09-14 12:39:09,442][75218] Sum rewards: 0.794, reward structure: {'HEALTH': '-2.680', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.024', 'AMMO2': '-0.005', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.059', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.268', 'weapon5': '0.498', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.950', 'weapon2': '1.092', 'weapon3': '1.828'} +[2023-09-14 12:39:09,443][75218] Sum rewards: 6.057, reward structure: {'HEALTH': '-0.950', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon5': '0.796', 'FRAGCOUNT': '1.000', 'weapon2': '1.056', 'weapon3': '1.232', 'DAMAGECOUNT': '2.570'} +[2023-09-14 12:39:09,642][75215] DAMAGECOUNT value on done: 522.0 +[2023-09-14 12:39:09,642][75215] DAMAGECOUNT value on done: 595.0 +[2023-09-14 12:39:09,643][75215] Sum rewards: 2.861, reward structure: {'HEALTH': '-3.350', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.019', 'weapon2': '0.068', 'AMMO4': '0.092', 'AMMO3': '0.115', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon4': '0.466', 'WEAPON3': '0.800', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.100', 'weapon3': '2.936'} +[2023-09-14 12:39:09,643][75215] Sum rewards: 7.292, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.013', 'AMMO5': '0.015', 'AMMO4': '0.065', 'AMMO3': '0.076', 'weapon2': '0.096', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.356', 'WEAPON3': '0.600', 'weapon5': '0.710', 'weapon3': '2.510', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.350'} +[2023-09-14 12:39:10,043][75218] DAMAGECOUNT value on done: 355.0 +[2023-09-14 12:39:10,043][75218] DAMAGECOUNT value on done: 498.0 +[2023-09-14 12:39:10,044][75218] Sum rewards: 4.358, reward structure: {'HEALTH': '-0.100', 'HITCOUNT': '0.000', 'AMMO2': '0.010', 'AMMO3': '0.020', 'AMMO4': '0.050', 'WEAPON4': '0.100', 'weapon2': '0.106', 'WEAPON3': '0.200', 'weapon4': '0.426', 'FRAGCOUNT': '1.000', 'weapon3': '1.066', 'DAMAGECOUNT': '1.480'} +[2023-09-14 12:39:10,078][75218] DAMAGECOUNT value on done: 353.0 +[2023-09-14 12:39:10,078][75218] DAMAGECOUNT value on done: 320.0 +[2023-09-14 12:39:10,078][75218] Sum rewards: 4.552, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.038', 'WEAPON5': '0.100', 'WEAPON3': '0.300', 'weapon2': '0.396', 'FRAGCOUNT': '1.000', 'weapon3': '1.106', 'DAMAGECOUNT': '1.200', 'weapon5': '2.438'} +[2023-09-14 12:39:10,079][75218] Sum rewards: 2.989, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.002', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.013', 'weapon2': '0.040', 'AMMO3': '0.060', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.414', 'WEAPON3': '0.500', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon5': '1.066', 'weapon3': '2.348'} +[2023-09-14 12:39:10,686][75218] DAMAGECOUNT value on done: 195.0 +[2023-09-14 12:39:10,686][75218] DAMAGECOUNT value on done: 212.0 +[2023-09-14 12:39:10,687][75218] Sum rewards: 2.249, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO5': '0.004', 'AMMO4': '0.011', 'AMMO3': '0.043', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.276', 'weapon5': '0.388', 'WEAPON3': '0.400', 'weapon2': '0.422', 'DAMAGECOUNT': '0.950', 'weapon3': '1.604'} +[2023-09-14 12:39:11,145][75219] DAMAGECOUNT value on done: 376.0 +[2023-09-14 12:39:11,145][75219] DAMAGECOUNT value on done: 640.0 +[2023-09-14 12:39:11,146][75219] Sum rewards: 4.406, reward structure: {'HEALTH': '-1.400', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.228', 'weapon2': '0.344', 'WEAPON3': '0.400', 'weapon5': '0.984', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.200', 'weapon3': '2.330'} +[2023-09-14 12:39:11,146][75219] Sum rewards: 3.188, reward structure: {'HEALTH': '-2.100', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.015', 'AMMO4': '0.074', 'AMMO3': '0.075', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon2': '0.364', 'weapon5': '0.494', 'WEAPON3': '0.600', 'weapon4': '0.652', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.400', 'weapon3': '2.206'} +[2023-09-14 12:39:11,379][75217] DAMAGECOUNT value on done: 247.0 +[2023-09-14 12:39:11,379][75217] DAMAGECOUNT value on done: 452.0 +[2023-09-14 12:39:11,380][75217] Sum rewards: 3.069, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.010', 'AMMO3': '0.037', 'AMMO4': '0.050', 'weapon2': '0.092', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.300', 'weapon4': '0.396', 'weapon5': '0.786', 'weapon3': '0.846', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.350'} +[2023-09-14 12:39:11,619][109198] Fps is (10 sec: 14745.6, 60 sec: 14745.6, 300 sec: 13209.6). Total num frames: 8417280. Throughput: 0: 1795.2, 1: 1873.0. Samples: 393218. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:39:11,620][109198] Avg episode reward: [(0, '4.011'), (1, '2.760')] +[2023-09-14 12:39:11,811][75219] DAMAGECOUNT value on done: 528.0 +[2023-09-14 12:39:11,811][75219] DAMAGECOUNT value on done: 380.0 +[2023-09-14 12:39:11,812][75219] Sum rewards: 2.650, reward structure: {'HEALTH': '-2.730', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'weapon5': '0.022', 'AMMO2': '0.028', 'AMMO3': '0.072', 'AMMO4': '0.140', 'WEAPON4': '0.200', 'weapon2': '0.232', 'weapon4': '0.292', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.750', 'weapon3': '2.728'} +[2023-09-14 12:39:11,812][75219] Sum rewards: 6.148, reward structure: {'HEALTH': '-1.750', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.018', 'AMMO2': '-0.004', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.228', 'weapon2': '0.310', 'WEAPON3': '0.400', 'weapon5': '1.160', 'FRAGCOUNT': '2.000', 'weapon3': '2.072', 'DAMAGECOUNT': '2.400'} +[2023-09-14 12:39:11,854][75253] DAMAGECOUNT value on done: 225.0 +[2023-09-14 12:39:11,854][75253] DAMAGECOUNT value on done: 130.0 +[2023-09-14 12:39:11,855][75253] Sum rewards: 2.618, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.020', 'AMMO3': '0.050', 'AMMO4': '0.098', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon2': '0.124', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.400', 'weapon4': '0.602', 'weapon3': '1.376', 'weapon5': '1.544'} +[2023-09-14 12:39:11,928][75217] DAMAGECOUNT value on done: 160.0 +[2023-09-14 12:39:11,928][75217] DAMAGECOUNT value on done: 342.0 +[2023-09-14 12:39:11,929][75217] Sum rewards: 5.618, reward structure: {'HEALTH': '-1.400', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.005', 'AMMO4': '0.025', 'AMMO3': '0.046', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.172', 'WEAPON3': '0.400', 'weapon2': '0.554', 'weapon5': '1.170', 'weapon3': '1.342', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.100'} +[2023-09-14 12:39:12,030][75214] Updated weights for policy 0, policy_version 1387 (0.0012) +[2023-09-14 12:39:12,431][75217] DAMAGECOUNT value on done: 300.0 +[2023-09-14 12:39:12,431][75217] DAMAGECOUNT value on done: 278.0 +[2023-09-14 12:39:12,432][75217] Sum rewards: 4.174, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.049', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.408', 'weapon5': '0.536', 'weapon4': '0.562', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.140', 'weapon3': '1.824'} +[2023-09-14 12:39:12,432][75217] Sum rewards: 3.761, reward structure: {'HEALTH': '-1.270', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO5': '0.007', 'AMMO4': '0.012', 'AMMO3': '0.047', 'weapon4': '0.084', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon2': '0.354', 'WEAPON3': '0.400', 'weapon5': '0.412', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150', 'weapon3': '2.262'} +[2023-09-14 12:39:12,491][75253] DAMAGECOUNT value on done: 237.0 +[2023-09-14 12:39:12,492][75253] DAMAGECOUNT value on done: 80.0 +[2023-09-14 12:39:12,704][75209] Updated weights for policy 1, policy_version 671 (0.0013) +[2023-09-14 12:39:13,042][75217] DAMAGECOUNT value on done: 553.0 +[2023-09-14 12:39:13,042][75217] Sum rewards: 7.248, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.015', 'weapon4': '0.062', 'AMMO3': '0.063', 'AMMO4': '0.075', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon2': '0.222', 'WEAPON3': '0.500', 'weapon5': '1.266', 'weapon3': '2.384', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.350'} +[2023-09-14 12:39:13,043][75217] DAMAGECOUNT value on done: 285.0 +[2023-09-14 12:39:13,043][75217] Sum rewards: 3.290, reward structure: {'HEALTH': '-3.200', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.029', 'AMMO3': '0.069', 'AMMO4': '0.144', 'WEAPON4': '0.200', 'weapon4': '0.326', 'WEAPON5': '0.400', 'weapon2': '0.400', 'weapon5': '0.418', 'WEAPON3': '0.600', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.150', 'weapon3': '2.734'} +[2023-09-14 12:39:13,327][75252] DAMAGECOUNT value on done: 472.0 +[2023-09-14 12:39:13,328][75252] DAMAGECOUNT value on done: 392.0 +[2023-09-14 12:39:13,328][75252] Sum rewards: 2.383, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.020', 'AMMO3': '0.030', 'AMMO4': '0.099', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.388', 'DAMAGECOUNT': '0.550', 'weapon5': '0.616', 'weapon4': '0.772', 'weapon3': '1.304'} +[2023-09-14 12:39:13,835][75252] DAMAGECOUNT value on done: 123.0 +[2023-09-14 12:39:13,835][75252] DAMAGECOUNT value on done: 155.0 +[2023-09-14 12:39:13,836][75252] Sum rewards: 5.263, reward structure: {'HEALTH': '-0.450', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.025', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.123', 'weapon2': '0.148', 'WEAPON3': '0.200', 'weapon4': '0.536', 'weapon3': '0.932', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150', 'weapon5': '1.374'} +[2023-09-14 12:39:14,435][75252] DAMAGECOUNT value on done: 145.0 +[2023-09-14 12:39:14,435][75252] DAMAGECOUNT value on done: 70.0 +[2023-09-14 12:39:14,435][75252] Sum rewards: 6.037, reward structure: {'HEALTH': '-0.050', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.015', 'AMMO3': '0.020', 'AMMO4': '0.075', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.412', 'weapon2': '0.504', 'weapon3': '0.990', 'FRAGCOUNT': '1.000', 'weapon5': '1.266', 'DAMAGECOUNT': '1.400'} +[2023-09-14 12:39:15,036][75252] DAMAGECOUNT value on done: 469.0 +[2023-09-14 12:39:15,036][75252] DAMAGECOUNT value on done: 429.0 +[2023-09-14 12:39:15,036][75252] Sum rewards: 7.061, reward structure: {'HEALTH': '-2.600', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'weapon2': '0.002', 'AMMO2': '0.013', 'AMMO5': '0.015', 'AMMO4': '0.067', 'AMMO3': '0.071', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon5': '0.542', 'WEAPON3': '0.600', 'weapon4': '0.604', 'weapon3': '2.596', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.650'} +[2023-09-14 12:39:15,037][75252] Sum rewards: 3.641, reward structure: {'HEALTH': '-3.550', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'weapon5': '0.006', 'AMMO5': '0.020', 'weapon2': '0.022', 'AMMO2': '0.043', 'AMMO3': '0.108', 'AMMO4': '0.214', 'weapon4': '0.256', 'WEAPON4': '0.400', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.600', 'weapon3': '3.322'} +[2023-09-14 12:39:15,106][75216] DAMAGECOUNT value on done: 265.0 +[2023-09-14 12:39:15,106][75216] DAMAGECOUNT value on done: 576.0 +[2023-09-14 12:39:15,107][75216] Sum rewards: 3.102, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'weapon2': '0.002', 'AMMO5': '0.010', 'AMMO2': '0.029', 'AMMO3': '0.071', 'AMMO4': '0.146', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon4': '0.456', 'WEAPON3': '0.500', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.674', 'weapon5': '1.714'} +[2023-09-14 12:39:15,107][75216] Sum rewards: 6.521, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.025', 'AMMO3': '0.040', 'WEAPON5': '0.100', 'AMMO4': '0.123', 'WEAPON4': '0.200', 'weapon2': '0.262', 'WEAPON3': '0.400', 'weapon4': '0.646', 'weapon5': '0.908', 'weapon3': '1.762', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050'} +[2023-09-14 12:39:15,685][75216] DAMAGECOUNT value on done: 550.0 +[2023-09-14 12:39:15,686][75216] Sum rewards: 5.102, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.020', 'AMMO3': '0.040', 'AMMO4': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon5': '0.206', 'WEAPON3': '0.400', 'weapon2': '0.660', 'weapon4': '0.706', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.800', 'weapon3': '1.866'} +[2023-09-14 12:39:15,685][75216] DAMAGECOUNT value on done: 421.0 +[2023-09-14 12:39:16,197][75215] DAMAGECOUNT value on done: 205.0 +[2023-09-14 12:39:16,197][75215] Sum rewards: 5.675, reward structure: {'HEALTH': '-0.900', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.424', 'FRAGCOUNT': '1.000', 'weapon3': '1.186', 'DAMAGECOUNT': '1.350', 'weapon5': '2.320'} +[2023-09-14 12:39:16,197][75215] DAMAGECOUNT value on done: 280.0 +[2023-09-14 12:39:16,249][75216] DAMAGECOUNT value on done: 158.0 +[2023-09-14 12:39:16,250][75216] DAMAGECOUNT value on done: 75.0 +[2023-09-14 12:39:16,250][75216] Sum rewards: 2.839, reward structure: {'HEALTH': '-1.180', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.040', 'weapon2': '0.066', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.454', 'DAMAGECOUNT': '0.500', 'weapon5': '0.922', 'weapon3': '2.230'} +[2023-09-14 12:39:16,619][109198] Fps is (10 sec: 13926.3, 60 sec: 14540.8, 300 sec: 13205.5). Total num frames: 8482816. Throughput: 0: 1791.3, 1: 1851.4. Samples: 408795. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:39:16,620][109198] Avg episode reward: [(0, '4.011'), (1, '2.911')] +[2023-09-14 12:39:16,640][75052] Saving new best policy, reward=2.911! +[2023-09-14 12:39:16,745][75254] DAMAGECOUNT value on done: 248.0 +[2023-09-14 12:39:16,745][75254] DAMAGECOUNT value on done: 56.0 +[2023-09-14 12:39:16,745][75254] Sum rewards: 3.601, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.010', 'AMMO3': '0.030', 'AMMO4': '0.050', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.402', 'weapon4': '0.494', 'weapon5': '0.536', 'FRAGCOUNT': '0.999', 'weapon3': '1.226', 'DAMAGECOUNT': '1.250'} +[2023-09-14 12:39:16,766][75215] DAMAGECOUNT value on done: 127.0 +[2023-09-14 12:39:16,767][75215] DAMAGECOUNT value on done: 77.0 +[2023-09-14 12:39:16,767][75215] Sum rewards: 2.221, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'DAMAGECOUNT': '0.020', 'AMMO2': '0.020', 'AMMO3': '0.056', 'AMMO4': '0.100', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon2': '0.220', 'WEAPON3': '0.400', 'weapon4': '0.610', 'weapon3': '0.974', 'weapon5': '1.412'} +[2023-09-14 12:39:16,840][75216] DAMAGECOUNT value on done: 315.0 +[2023-09-14 12:39:16,841][75216] DAMAGECOUNT value on done: 429.0 +[2023-09-14 12:39:16,841][75216] Sum rewards: 7.855, reward structure: {'HEALTH': '-0.900', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'weapon2': '0.054', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.342', 'weapon3': '1.224', 'FRAGCOUNT': '2.000', 'weapon5': '2.230', 'DAMAGECOUNT': '2.450'} +[2023-09-14 12:39:17,321][75254] DAMAGECOUNT value on done: 373.0 +[2023-09-14 12:39:17,321][75254] DAMAGECOUNT value on done: 440.0 +[2023-09-14 12:39:17,882][75254] DAMAGECOUNT value on done: 195.0 +[2023-09-14 12:39:17,882][75254] DAMAGECOUNT value on done: 575.0 +[2023-09-14 12:39:17,883][75254] Sum rewards: 1.709, reward structure: {'HEALTH': '-2.250', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'weapon2': '0.004', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO4': '0.025', 'AMMO3': '0.055', 'weapon5': '0.076', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon4': '0.492', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.696', 'DAMAGECOUNT': '1.800'} +[2023-09-14 12:39:17,883][75254] Sum rewards: 6.174, reward structure: {'HEALTH': '-1.750', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.020', 'AMMO2': '-0.004', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.039', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.224', 'weapon2': '0.316', 'WEAPON3': '0.400', 'weapon5': '1.028', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.300', 'weapon3': '2.330'} +[2023-09-14 12:39:18,029][75214] Updated weights for policy 0, policy_version 1397 (0.0012) +[2023-09-14 12:39:18,462][75254] DAMAGECOUNT value on done: 225.0 +[2023-09-14 12:39:18,462][75254] DAMAGECOUNT value on done: 330.0 +[2023-09-14 12:39:18,463][75254] Sum rewards: 5.493, reward structure: {'HEALTH': '-0.200', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.358', 'FRAGCOUNT': '1.000', 'weapon5': '1.090', 'weapon3': '1.252', 'DAMAGECOUNT': '1.700'} +[2023-09-14 12:39:18,552][75209] Updated weights for policy 1, policy_version 681 (0.0012) +[2023-09-14 12:39:21,619][109198] Fps is (10 sec: 13926.4, 60 sec: 14609.1, 300 sec: 13264.7). Total num frames: 8556544. Throughput: 0: 1814.5, 1: 1839.4. Samples: 424065. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:39:21,620][109198] Avg episode reward: [(0, '4.041'), (1, '2.891')] +[2023-09-14 12:39:23,946][75214] Updated weights for policy 0, policy_version 1407 (0.0012) +[2023-09-14 12:39:24,545][75209] Updated weights for policy 1, policy_version 691 (0.0011) +[2023-09-14 12:39:26,619][109198] Fps is (10 sec: 13926.4, 60 sec: 14404.3, 300 sec: 13258.9). Total num frames: 8622080. Throughput: 0: 1815.4, 1: 1814.5. Samples: 444428. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:39:26,620][109198] Avg episode reward: [(0, '4.041'), (1, '2.891')] +[2023-09-14 12:39:30,031][75214] Updated weights for policy 0, policy_version 1417 (0.0013) +[2023-09-14 12:39:30,421][75209] Updated weights for policy 1, policy_version 701 (0.0011) +[2023-09-14 12:39:31,619][109198] Fps is (10 sec: 13516.8, 60 sec: 14404.3, 300 sec: 13282.7). Total num frames: 8691712. Throughput: 0: 1811.5, 1: 1804.9. Samples: 459875. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:39:31,620][109198] Avg episode reward: [(0, '4.041'), (1, '2.891')] +[2023-09-14 12:39:35,420][75214] Updated weights for policy 0, policy_version 1427 (0.0016) +[2023-09-14 12:39:35,924][75209] Updated weights for policy 1, policy_version 711 (0.0013) +[2023-09-14 12:39:36,619][109198] Fps is (10 sec: 14336.0, 60 sec: 14472.5, 300 sec: 13333.2). Total num frames: 8765440. Throughput: 0: 1815.7, 1: 1814.0. Samples: 476554. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:39:36,620][109198] Avg episode reward: [(0, '4.041'), (1, '2.891')] +[2023-09-14 12:39:41,167][75214] Updated weights for policy 0, policy_version 1437 (0.0011) +[2023-09-14 12:39:41,619][109198] Fps is (10 sec: 14336.1, 60 sec: 14404.3, 300 sec: 13353.0). Total num frames: 8835072. Throughput: 0: 1799.6, 1: 1799.2. Samples: 497996. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:39:41,620][109198] Avg episode reward: [(0, '4.041'), (1, '2.891')] +[2023-09-14 12:39:41,809][75209] Updated weights for policy 1, policy_version 721 (0.0012) +[2023-09-14 12:39:42,740][109198] Keyboard interrupt detected in the event loop EvtLoop [Runner_EvtLoop, process=main process 109198], exiting... +[2023-09-14 12:39:42,741][74942] Stopping Batcher_0... +[2023-09-14 12:39:42,742][75052] Stopping Batcher_1... +[2023-09-14 12:39:42,742][74942] Loop batcher_evt_loop terminating... +[2023-09-14 12:39:42,742][109198] Runner profile tree view: +main_loop: 158.9516 +[2023-09-14 12:39:42,743][74942] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001439_5894144.pth... +[2023-09-14 12:39:42,743][75052] Loop batcher_evt_loop terminating... +[2023-09-14 12:39:42,743][109198] Collected {0: 5894144, 1: 2957312}, FPS: 12704.0 +[2023-09-14 12:39:42,744][75052] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000722_2957312.pth... +[2023-09-14 12:39:42,759][75209] Weights refcount: 2 0 +[2023-09-14 12:39:42,760][75209] Stopping InferenceWorker_p1-w0... +[2023-09-14 12:39:42,761][75209] Loop inference_proc1-0_evt_loop terminating... +[2023-09-14 12:39:42,762][75214] Weights refcount: 2 0 +[2023-09-14 12:39:42,763][75214] Stopping InferenceWorker_p0-w0... +[2023-09-14 12:39:42,763][75214] Loop inference_proc0-0_evt_loop terminating... +[2023-09-14 12:39:42,802][74942] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001187_4861952.pth +[2023-09-14 12:39:42,803][75052] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000481_1970176.pth +[2023-09-14 12:39:42,809][74942] Stopping LearnerWorker_p0... +[2023-09-14 12:39:42,809][74942] Loop learner_proc0_evt_loop terminating... +[2023-09-14 12:39:42,810][75052] Stopping LearnerWorker_p1... +[2023-09-14 12:39:42,810][75052] Loop learner_proc1_evt_loop terminating... +[2023-09-14 12:39:43,547][75254] Stopping RolloutWorker_w7... +[2023-09-14 12:39:43,547][75215] Stopping RolloutWorker_w1... +[2023-09-14 12:39:43,548][75215] Loop rollout_proc1_evt_loop terminating... +[2023-09-14 12:39:43,548][75254] Loop rollout_proc7_evt_loop terminating... +[2023-09-14 12:39:43,549][75218] Stopping RolloutWorker_w3... +[2023-09-14 12:39:43,550][75218] Loop rollout_proc3_evt_loop terminating... +[2023-09-14 12:39:43,550][75253] Stopping RolloutWorker_w6... +[2023-09-14 12:39:43,551][75253] Loop rollout_proc6_evt_loop terminating... +[2023-09-14 12:39:43,553][75252] Stopping RolloutWorker_w5... +[2023-09-14 12:39:43,554][75252] Loop rollout_proc5_evt_loop terminating... +[2023-09-14 12:39:43,554][75219] Stopping RolloutWorker_w4... +[2023-09-14 12:39:43,556][75219] Loop rollout_proc4_evt_loop terminating... +[2023-09-14 12:39:43,558][75217] Stopping RolloutWorker_w2... +[2023-09-14 12:39:43,558][75217] Loop rollout_proc2_evt_loop terminating... +[2023-09-14 12:39:43,569][75216] Stopping RolloutWorker_w0... +[2023-09-14 12:39:43,570][75216] Loop rollout_proc0_evt_loop terminating... +[2023-09-14 12:41:42,872][109198] Environment doom_basic already registered, overwriting... +[2023-09-14 12:41:42,875][109198] Environment doom_two_colors_easy already registered, overwriting... +[2023-09-14 12:41:42,877][109198] Environment doom_two_colors_hard already registered, overwriting... +[2023-09-14 12:41:42,878][109198] Environment doom_dm already registered, overwriting... +[2023-09-14 12:41:42,879][109198] Environment doom_dwango5 already registered, overwriting... +[2023-09-14 12:41:42,880][109198] Environment doom_my_way_home_flat_actions already registered, overwriting... +[2023-09-14 12:41:42,881][109198] Environment doom_defend_the_center_flat_actions already registered, overwriting... +[2023-09-14 12:41:42,882][109198] Environment doom_my_way_home already registered, overwriting... +[2023-09-14 12:41:42,884][109198] Environment doom_deadly_corridor already registered, overwriting... +[2023-09-14 12:41:42,886][109198] Environment doom_defend_the_center already registered, overwriting... +[2023-09-14 12:41:42,887][109198] Environment doom_defend_the_line already registered, overwriting... +[2023-09-14 12:41:42,889][109198] Environment doom_health_gathering already registered, overwriting... +[2023-09-14 12:41:42,890][109198] Environment doom_health_gathering_supreme already registered, overwriting... +[2023-09-14 12:41:42,891][109198] Environment doom_battle already registered, overwriting... +[2023-09-14 12:41:42,893][109198] Environment doom_battle2 already registered, overwriting... +[2023-09-14 12:41:42,894][109198] Environment doom_duel_bots already registered, overwriting... +[2023-09-14 12:41:42,895][109198] Environment doom_deathmatch_bots already registered, overwriting... +[2023-09-14 12:41:42,897][109198] Environment doom_duel already registered, overwriting... +[2023-09-14 12:41:42,897][109198] Environment doom_deathmatch_full already registered, overwriting... +[2023-09-14 12:41:42,898][109198] Environment doom_benchmark already registered, overwriting... +[2023-09-14 12:41:42,899][109198] register_encoder_factory: +[2023-09-14 12:41:42,922][109198] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json +[2023-09-14 12:41:42,926][109198] Experiment dir /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment already exists! +[2023-09-14 12:41:42,927][109198] Resuming existing experiment from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment... +[2023-09-14 12:41:42,928][109198] Weights and Biases integration disabled +[2023-09-14 12:41:42,931][109198] Environment var CUDA_VISIBLE_DEVICES is 0,1 + +[2023-09-14 12:41:45,144][109198] Starting experiment with the following configuration: +help=False +algo=APPO +env=doom_duel +experiment=default_experiment +train_dir=/home/cogstack/Documents/optuna/environments/sample_factory/train_dir +restart_behavior=resume +device=gpu +seed=None +num_policies=2 +async_rl=True +serial_mode=False +batched_sampling=False +num_batches_to_accumulate=2 +worker_num_splits=2 +policy_workers_per_policy=1 +max_policy_lag=1000 +num_workers=8 +num_envs_per_worker=4 +batch_size=1024 +num_batches_per_epoch=1 +num_epochs=1 +rollout=32 +recurrence=32 +shuffle_minibatches=False +gamma=0.99 +reward_scale=1.0 +reward_clip=1000.0 +value_bootstrap=False +normalize_returns=True +exploration_loss_coeff=0.001 +value_loss_coeff=0.5 +kl_loss_coeff=0.0 +exploration_loss=symmetric_kl +gae_lambda=0.95 +ppo_clip_ratio=0.1 +ppo_clip_value=0.2 +with_vtrace=False +vtrace_rho=1.0 +vtrace_c=1.0 +optimizer=adam +adam_eps=1e-06 +adam_beta1=0.9 +adam_beta2=0.999 +max_grad_norm=4.0 +learning_rate=0.0001 +lr_schedule=constant +lr_schedule_kl_threshold=0.008 +lr_adaptive_min=1e-06 +lr_adaptive_max=0.01 +obs_subtract_mean=0.0 +obs_scale=255.0 +normalize_input=True +normalize_input_keys=None +decorrelate_experience_max_seconds=0 +decorrelate_envs_on_one_worker=True +actor_worker_gpus=[] +set_workers_cpu_affinity=True +force_envs_single_thread=False +default_niceness=0 +log_to_file=True +experiment_summaries_interval=10 +flush_summaries_interval=30 +stats_avg=100 +summaries_use_frameskip=True +heartbeat_interval=20 +heartbeat_reporting_interval=600 +train_for_env_steps=10000000 +train_for_seconds=10000000000 +save_every_sec=120 +keep_checkpoints=2 +load_checkpoint_kind=latest +save_milestones_sec=-1 +save_best_every_sec=5 +save_best_metric=reward +save_best_after=100000 +benchmark=False +encoder_mlp_layers=[512, 512] +encoder_conv_architecture=convnet_simple +encoder_conv_mlp_layers=[512] +use_rnn=True +rnn_size=512 +rnn_type=gru +rnn_num_layers=1 +decoder_mlp_layers=[] +nonlinearity=elu +policy_initialization=orthogonal +policy_init_gain=1.0 +actor_critic_share_weights=True +adaptive_stddev=True +continuous_tanh_scale=0.0 +initial_stddev=1.0 +use_env_info_cache=False +env_gpu_actions=False +env_gpu_observations=True +env_frameskip=4 +env_framestack=1 +pixel_format=CHW +use_record_episode_statistics=False +with_wandb=False +wandb_user=None +wandb_project=sample_factory +wandb_group=None +wandb_job_type=SF +wandb_tags=[] +with_pbt=False +pbt_mix_policies_in_one_env=True +pbt_period_env_steps=5000000 +pbt_start_mutation=20000000 +pbt_replace_fraction=0.3 +pbt_mutation_rate=0.15 +pbt_replace_reward_gap=0.1 +pbt_replace_reward_gap_absolute=1e-06 +pbt_optimize_gamma=False +pbt_target_objective=true_objective +pbt_perturb_min=1.1 +pbt_perturb_max=1.5 +num_agents=-1 +num_humans=0 +num_bots=-1 +start_bot_difficulty=None +timelimit=None +res_w=128 +res_h=72 +wide_aspect_ratio=False +eval_env_frameskip=1 +fps=35 +command_line=--env=doom_dm --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=20000000 +cli_args={'env': 'doom_dm', 'num_workers': 8, 'num_envs_per_worker': 4, 'train_for_env_steps': 20000000} +git_hash=20b6d44612dad7d171f23e13b1f3b4c5e5631cf9 +git_repo_name=https://github.com/MattStammers/optuna.git +[2023-09-14 12:41:45,147][109198] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json... +[2023-09-14 12:41:45,268][109198] Rollout worker 0 uses device cpu +[2023-09-14 12:41:45,270][109198] Rollout worker 1 uses device cpu +[2023-09-14 12:41:45,272][109198] Rollout worker 2 uses device cpu +[2023-09-14 12:41:45,275][109198] Rollout worker 3 uses device cpu +[2023-09-14 12:41:45,277][109198] Rollout worker 4 uses device cpu +[2023-09-14 12:41:45,278][109198] Rollout worker 5 uses device cpu +[2023-09-14 12:41:45,282][109198] Rollout worker 6 uses device cpu +[2023-09-14 12:41:45,287][109198] Rollout worker 7 uses device cpu +[2023-09-14 12:41:45,377][109198] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:41:45,378][109198] InferenceWorker_p0-w0: min num requests: 1 +[2023-09-14 12:41:45,383][109198] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:41:45,384][109198] InferenceWorker_p1-w0: min num requests: 1 +[2023-09-14 12:41:45,415][109198] Starting all processes... +[2023-09-14 12:41:45,416][109198] Starting process learner_proc0 +[2023-09-14 12:41:46,975][109198] Starting process learner_proc1 +[2023-09-14 12:41:46,977][93585] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:41:46,977][93585] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 +[2023-09-14 12:41:47,016][93585] Num visible devices: 1 +[2023-09-14 12:41:47,057][93585] Starting seed is not provided +[2023-09-14 12:41:47,057][93585] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:41:47,057][93585] Initializing actor-critic model on device cuda:0 +[2023-09-14 12:41:47,058][93585] RunningMeanStd input shape: (23,) +[2023-09-14 12:41:47,059][93585] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:41:47,059][93585] RunningMeanStd input shape: (1,) +[2023-09-14 12:41:47,078][93585] ConvEncoder: input_channels=3 +[2023-09-14 12:41:47,242][93585] Conv encoder output size: 512 +[2023-09-14 12:41:47,243][93585] Policy head output size: 640 +[2023-09-14 12:41:47,261][93585] Created Actor Critic model with architecture: +[2023-09-14 12:41:47,262][93585] ActorCriticSharedWeights( + (obs_normalizer): ObservationNormalizer( + (running_mean_std): RunningMeanStdDictInPlace( + (running_mean_std): ModuleDict( + (measurements): RunningMeanStdInPlace() + (obs): RunningMeanStdInPlace() + ) + ) + ) + (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) + (encoder): VizdoomEncoder( + (basic_encoder): ConvEncoder( + (enc): RecursiveScriptModule( + original_name=ConvEncoderImpl + (conv_head): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Conv2d) + (1): RecursiveScriptModule(original_name=ELU) + (2): RecursiveScriptModule(original_name=Conv2d) + (3): RecursiveScriptModule(original_name=ELU) + (4): RecursiveScriptModule(original_name=Conv2d) + (5): RecursiveScriptModule(original_name=ELU) + ) + (mlp_layers): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Linear) + (1): RecursiveScriptModule(original_name=ELU) + ) + ) + ) + (measurements_head): Sequential( + (0): Linear(in_features=23, out_features=128, bias=True) + (1): ELU(alpha=1.0) + (2): Linear(in_features=128, out_features=128, bias=True) + (3): ELU(alpha=1.0) + ) + ) + (core): ModelCoreRNN( + (core): GRU(640, 512) + ) + (decoder): MlpDecoder( + (mlp): Identity() + ) + (critic_linear): Linear(in_features=512, out_features=1, bias=True) + (action_parameterization): ActionParameterizationDefault( + (distribution_linear): Linear(in_features=512, out_features=41, bias=True) + ) +) +[2023-09-14 12:41:48,157][93585] Using optimizer +[2023-09-14 12:41:48,158][93585] Loading state from checkpoint /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001439_5894144.pth... +[2023-09-14 12:41:48,186][93585] Loading model from checkpoint +[2023-09-14 12:41:48,191][93585] Loaded experiment state at self.train_step=1439, self.env_steps=5894144 +[2023-09-14 12:41:48,192][93585] Initialized policy 0 weights for model version 1439 +[2023-09-14 12:41:48,193][93585] LearnerWorker_p0 finished initialization! +[2023-09-14 12:41:48,194][93585] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:41:48,678][93674] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:41:48,679][93674] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for learning process 1 +[2023-09-14 12:41:48,677][109198] Starting all processes... +[2023-09-14 12:41:48,684][109198] Starting process inference_proc0-0 +[2023-09-14 12:41:48,685][109198] Starting process inference_proc1-0 +[2023-09-14 12:41:48,685][109198] Starting process rollout_proc0 +[2023-09-14 12:41:48,685][109198] Starting process rollout_proc1 +[2023-09-14 12:41:48,719][93674] Num visible devices: 1 +[2023-09-14 12:41:48,686][109198] Starting process rollout_proc2 +[2023-09-14 12:41:48,686][109198] Starting process rollout_proc3 +[2023-09-14 12:41:48,688][109198] Starting process rollout_proc4 +[2023-09-14 12:41:48,689][109198] Starting process rollout_proc5 +[2023-09-14 12:41:48,761][93674] Starting seed is not provided +[2023-09-14 12:41:48,762][93674] Using GPUs [0] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:41:48,762][93674] Initializing actor-critic model on device cuda:0 +[2023-09-14 12:41:48,762][93674] RunningMeanStd input shape: (23,) +[2023-09-14 12:41:48,762][93674] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:41:48,763][93674] RunningMeanStd input shape: (1,) +[2023-09-14 12:41:48,690][109198] Starting process rollout_proc6 +[2023-09-14 12:41:48,690][109198] Starting process rollout_proc7 +[2023-09-14 12:41:48,778][93674] ConvEncoder: input_channels=3 +[2023-09-14 12:41:49,018][93674] Conv encoder output size: 512 +[2023-09-14 12:41:49,019][93674] Policy head output size: 640 +[2023-09-14 12:41:49,037][93674] Created Actor Critic model with architecture: +[2023-09-14 12:41:49,037][93674] ActorCriticSharedWeights( + (obs_normalizer): ObservationNormalizer( + (running_mean_std): RunningMeanStdDictInPlace( + (running_mean_std): ModuleDict( + (measurements): RunningMeanStdInPlace() + (obs): RunningMeanStdInPlace() + ) + ) + ) + (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) + (encoder): VizdoomEncoder( + (basic_encoder): ConvEncoder( + (enc): RecursiveScriptModule( + original_name=ConvEncoderImpl + (conv_head): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Conv2d) + (1): RecursiveScriptModule(original_name=ELU) + (2): RecursiveScriptModule(original_name=Conv2d) + (3): RecursiveScriptModule(original_name=ELU) + (4): RecursiveScriptModule(original_name=Conv2d) + (5): RecursiveScriptModule(original_name=ELU) + ) + (mlp_layers): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Linear) + (1): RecursiveScriptModule(original_name=ELU) + ) + ) + ) + (measurements_head): Sequential( + (0): Linear(in_features=23, out_features=128, bias=True) + (1): ELU(alpha=1.0) + (2): Linear(in_features=128, out_features=128, bias=True) + (3): ELU(alpha=1.0) + ) + ) + (core): ModelCoreRNN( + (core): GRU(640, 512) + ) + (decoder): MlpDecoder( + (mlp): Identity() + ) + (critic_linear): Linear(in_features=512, out_features=1, bias=True) + (action_parameterization): ActionParameterizationDefault( + (distribution_linear): Linear(in_features=512, out_features=41, bias=True) + ) +) +[2023-09-14 12:41:50,182][93674] Using optimizer +[2023-09-14 12:41:50,183][93674] Loading state from checkpoint /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000722_2957312.pth... +[2023-09-14 12:41:50,214][93674] Loading model from checkpoint +[2023-09-14 12:41:50,219][93674] Loaded experiment state at self.train_step=722, self.env_steps=2957312 +[2023-09-14 12:41:50,220][93674] Initialized policy 1 weights for model version 722 +[2023-09-14 12:41:50,222][93674] LearnerWorker_p1 finished initialization! +[2023-09-14 12:41:50,222][93674] Using GPUs [0] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:41:50,701][93835] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:41:50,701][93835] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 +[2023-09-14 12:41:50,715][93836] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:41:50,715][93836] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for inference process 1 +[2023-09-14 12:41:50,733][93836] Num visible devices: 1 +[2023-09-14 12:41:50,735][93873] Worker 4 uses CPU cores [16, 17, 18, 19] +[2023-09-14 12:41:50,737][93835] Num visible devices: 1 +[2023-09-14 12:41:50,741][93837] Worker 0 uses CPU cores [0, 1, 2, 3] +[2023-09-14 12:41:50,759][93874] Worker 5 uses CPU cores [20, 21, 22, 23] +[2023-09-14 12:41:50,783][93839] Worker 2 uses CPU cores [8, 9, 10, 11] +[2023-09-14 12:41:50,855][93871] Worker 3 uses CPU cores [12, 13, 14, 15] +[2023-09-14 12:41:50,866][93906] Worker 6 uses CPU cores [24, 25, 26, 27] +[2023-09-14 12:41:50,894][93838] Worker 1 uses CPU cores [4, 5, 6, 7] +[2023-09-14 12:41:50,920][93987] Worker 7 uses CPU cores [28, 29, 30, 31] +[2023-09-14 12:41:51,522][93835] RunningMeanStd input shape: (23,) +[2023-09-14 12:41:51,523][93835] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:41:51,523][93835] RunningMeanStd input shape: (1,) +[2023-09-14 12:41:51,527][93836] RunningMeanStd input shape: (23,) +[2023-09-14 12:41:51,527][93836] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:41:51,527][93836] RunningMeanStd input shape: (1,) +[2023-09-14 12:41:51,535][93835] ConvEncoder: input_channels=3 +[2023-09-14 12:41:51,539][93836] ConvEncoder: input_channels=3 +[2023-09-14 12:41:51,640][93835] Conv encoder output size: 512 +[2023-09-14 12:41:51,641][93835] Policy head output size: 640 +[2023-09-14 12:41:51,642][93836] Conv encoder output size: 512 +[2023-09-14 12:41:51,644][93836] Policy head output size: 640 +[2023-09-14 12:41:51,929][109198] Inference worker 0-0 is ready! +[2023-09-14 12:41:51,937][109198] Inference worker 1-0 is ready! +[2023-09-14 12:41:51,939][109198] All inference workers are ready! Signal rollout workers to start! +[2023-09-14 12:41:51,944][93874] Multi agent env, num agents: 2 +[2023-09-14 12:41:51,944][93838] Multi agent env, num agents: 2 +[2023-09-14 12:41:51,944][93873] Multi agent env, num agents: 2 +[2023-09-14 12:41:51,946][93906] Multi agent env, num agents: 2 +[2023-09-14 12:41:51,946][93837] Multi agent env, num agents: 2 +[2023-09-14 12:41:51,946][93839] Multi agent env, num agents: 2 +[2023-09-14 12:41:51,948][93987] Multi agent env, num agents: 2 +[2023-09-14 12:41:51,948][93871] Multi agent env, num agents: 2 +[2023-09-14 12:41:51,973][93874] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:41:51,976][93874] Multi agent env, num agents: 2 +[2023-09-14 12:41:51,977][93837] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:41:51,978][93906] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:41:51,979][93839] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:41:51,980][93837] Multi agent env, num agents: 2 +[2023-09-14 12:41:51,981][93906] Multi agent env, num agents: 2 +[2023-09-14 12:41:51,981][93839] Multi agent env, num agents: 2 +[2023-09-14 12:41:51,990][93873] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:41:51,990][93838] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:41:51,994][93873] Multi agent env, num agents: 2 +[2023-09-14 12:41:51,995][93838] Multi agent env, num agents: 2 +[2023-09-14 12:41:51,998][93871] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:41:51,998][93987] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:41:52,003][93987] Multi agent env, num agents: 2 +[2023-09-14 12:41:52,003][93871] Multi agent env, num agents: 2 +[2023-09-14 12:41:52,005][93874] Port 40800 is available +[2023-09-14 12:41:52,005][93874] Using port 40800 +[2023-09-14 12:41:52,006][93874] Initializing env for player 0, init_info: {'port': 40800}... +[2023-09-14 12:41:52,011][93906] Port 40900 is available +[2023-09-14 12:41:52,011][93906] Using port 40900 +[2023-09-14 12:41:52,011][93837] Port 40300 is available +[2023-09-14 12:41:52,011][93837] Using port 40300 +[2023-09-14 12:41:52,012][93839] Port 40500 is available +[2023-09-14 12:41:52,012][93839] Using port 40500 +[2023-09-14 12:41:52,012][93906] Initializing env for player 0, init_info: {'port': 40900}... +[2023-09-14 12:41:52,012][93837] Initializing env for player 0, init_info: {'port': 40300}... +[2023-09-14 12:41:52,013][93839] Initializing env for player 0, init_info: {'port': 40500}... +[2023-09-14 12:41:52,038][93873] Port 40700 is available +[2023-09-14 12:41:52,039][93873] Using port 40700 +[2023-09-14 12:41:52,040][93874] Using port 40800 on host... +[2023-09-14 12:41:52,040][93873] Initializing env for player 0, init_info: {'port': 40700}... +[2023-09-14 12:41:52,042][93839] Using port 40500 on host... +[2023-09-14 12:41:52,042][93906] Using port 40900 on host... +[2023-09-14 12:41:52,043][93838] Port 40400 is available +[2023-09-14 12:41:52,043][93838] Using port 40400 +[2023-09-14 12:41:52,044][93838] Initializing env for player 0, init_info: {'port': 40400}... +[2023-09-14 12:41:52,051][93987] UDP port 41000 cannot be used [Errno 98] Address already in use +[2023-09-14 12:41:52,051][93837] Using port 40300 on host... +[2023-09-14 12:41:52,051][93987] Port 42000 is available +[2023-09-14 12:41:52,052][93987] Using port 42000 +[2023-09-14 12:41:52,052][93871] Port 40600 is available +[2023-09-14 12:41:52,052][93871] Using port 40600 +[2023-09-14 12:41:52,053][93987] Initializing env for player 0, init_info: {'port': 42000}... +[2023-09-14 12:41:52,057][93874] Initializing env for player 1, init_info: {'port': 40800}... +[2023-09-14 12:41:52,063][93906] Initializing env for player 1, init_info: {'port': 40900}... +[2023-09-14 12:41:52,063][93837] Initializing env for player 1, init_info: {'port': 40300}... +[2023-09-14 12:41:52,063][93839] Initializing env for player 1, init_info: {'port': 40500}... +[2023-09-14 12:41:52,085][93873] Using port 40700 on host... +[2023-09-14 12:41:52,087][93987] Using port 42000 on host... +[2023-09-14 12:41:52,089][93838] Using port 40400 on host... +[2023-09-14 12:41:52,094][93873] Initializing env for player 1, init_info: {'port': 40700}... +[2023-09-14 12:41:52,098][93838] Initializing env for player 1, init_info: {'port': 40400}... +[2023-09-14 12:41:52,103][93987] Initializing env for player 1, init_info: {'port': 42000}... +[2023-09-14 12:41:52,931][109198] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 8851456. Throughput: 0: nan, 1: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 12:41:53,185][93906] Initialized w:6 v:0 player:0 +[2023-09-14 12:41:53,186][93906] Initialized w:6 v:0 player:1 +[2023-09-14 12:41:53,187][93906] 2 agent workers initialized for env 6! +[2023-09-14 12:41:53,195][93906] Decorrelating experience for 0 frames... +[2023-09-14 12:41:53,195][93906] Port 40901 is available +[2023-09-14 12:41:53,195][93906] Using port 40901 +[2023-09-14 12:41:53,227][93987] Initialized w:7 v:0 player:1 +[2023-09-14 12:41:53,227][93987] Initialized w:7 v:0 player:0 +[2023-09-14 12:41:53,227][93874] Initialized w:5 v:0 player:1 +[2023-09-14 12:41:53,228][93987] 2 agent workers initialized for env 7! +[2023-09-14 12:41:53,228][93874] Initialized w:5 v:0 player:0 +[2023-09-14 12:41:53,229][93874] 2 agent workers initialized for env 5! +[2023-09-14 12:41:53,235][93837] Initialized w:0 v:0 player:1 +[2023-09-14 12:41:53,235][93837] Initialized w:0 v:0 player:0 +[2023-09-14 12:41:53,237][93837] 2 agent workers initialized for env 0! +[2023-09-14 12:41:53,239][93874] Decorrelating experience for 0 frames... +[2023-09-14 12:41:53,240][93987] Decorrelating experience for 0 frames... +[2023-09-14 12:41:53,241][93987] UDP port 41001 cannot be used [Errno 98] Address already in use +[2023-09-14 12:41:53,241][93987] Port 42001 is available +[2023-09-14 12:41:53,241][93987] Using port 42001 +[2023-09-14 12:41:53,241][93839] Initialized w:2 v:0 player:1 +[2023-09-14 12:41:53,242][93987] Initializing env for player 0, init_info: {'port': 42001}... +[2023-09-14 12:41:53,242][93839] Initialized w:2 v:0 player:0 +[2023-09-14 12:41:53,243][93874] Port 40801 is available +[2023-09-14 12:41:53,243][93874] Using port 40801 +[2023-09-14 12:41:53,244][93839] 2 agent workers initialized for env 2! +[2023-09-14 12:41:53,246][93837] Decorrelating experience for 0 frames... +[2023-09-14 12:41:53,246][93906] Initializing env for player 0, init_info: {'port': 40901}... +[2023-09-14 12:41:53,247][93837] Port 40301 is available +[2023-09-14 12:41:53,247][93837] Using port 40301 +[2023-09-14 12:41:53,248][93837] Initializing env for player 0, init_info: {'port': 40301}... +[2023-09-14 12:41:53,256][93839] Decorrelating experience for 0 frames... +[2023-09-14 12:41:53,257][93839] Port 40501 is available +[2023-09-14 12:41:53,257][93839] Using port 40501 +[2023-09-14 12:41:53,264][93871] Initializing env for player 0, init_info: {'port': 40600}... +[2023-09-14 12:41:53,269][93873] Initialized w:4 v:0 player:0 +[2023-09-14 12:41:53,270][93873] Initialized w:4 v:0 player:1 +[2023-09-14 12:41:53,271][93873] 2 agent workers initialized for env 4! +[2023-09-14 12:41:53,272][93987] Using port 42001 on host... +[2023-09-14 12:41:53,277][93837] Using port 40301 on host... +[2023-09-14 12:41:53,277][93906] Using port 40901 on host... +[2023-09-14 12:41:53,281][93873] Decorrelating experience for 0 frames... +[2023-09-14 12:41:53,282][93873] Port 40701 is available +[2023-09-14 12:41:53,282][93873] Using port 40701 +[2023-09-14 12:41:53,282][93838] Initialized w:1 v:0 player:0 +[2023-09-14 12:41:53,283][93838] Initialized w:1 v:0 player:1 +[2023-09-14 12:41:53,284][93838] 2 agent workers initialized for env 1! +[2023-09-14 12:41:53,292][93987] Initializing env for player 1, init_info: {'port': 42001}... +[2023-09-14 12:41:53,294][93871] Using port 40600 on host... +[2023-09-14 12:41:53,295][93838] Decorrelating experience for 0 frames... +[2023-09-14 12:41:53,296][93838] Port 40401 is available +[2023-09-14 12:41:53,296][93838] Using port 40401 +[2023-09-14 12:41:53,297][93838] Initializing env for player 0, init_info: {'port': 40401}... +[2023-09-14 12:41:53,297][93906] Initializing env for player 1, init_info: {'port': 40901}... +[2023-09-14 12:41:53,298][93837] Initializing env for player 1, init_info: {'port': 40301}... +[2023-09-14 12:41:53,308][93839] Initializing env for player 0, init_info: {'port': 40501}... +[2023-09-14 12:41:53,315][93871] Initializing env for player 1, init_info: {'port': 40600}... +[2023-09-14 12:41:53,326][93838] Using port 40401 on host... +[2023-09-14 12:41:53,343][93839] Using port 40501 on host... +[2023-09-14 12:41:53,347][93838] Initializing env for player 1, init_info: {'port': 40401}... +[2023-09-14 12:41:53,359][93839] Initializing env for player 1, init_info: {'port': 40501}... +[2023-09-14 12:41:54,315][93837] Initialized w:0 v:1 player:1 +[2023-09-14 12:41:54,316][93837] Initialized w:0 v:1 player:0 +[2023-09-14 12:41:54,318][93837] 2 agent workers initialized for env 0! +[2023-09-14 12:41:54,328][93837] Decorrelating experience for 32 frames... +[2023-09-14 12:41:54,388][93839] Initialized w:2 v:1 player:1 +[2023-09-14 12:41:54,389][93839] Initialized w:2 v:1 player:0 +[2023-09-14 12:41:54,390][93839] 2 agent workers initialized for env 2! +[2023-09-14 12:41:54,398][93839] Decorrelating experience for 32 frames... +[2023-09-14 12:41:54,402][93837] Multi agent env, num agents: 2 +[2023-09-14 12:41:54,408][93906] Initialized w:6 v:1 player:1 +[2023-09-14 12:41:54,409][93906] Initialized w:6 v:1 player:0 +[2023-09-14 12:41:54,410][93906] 2 agent workers initialized for env 6! +[2023-09-14 12:41:54,422][93906] Decorrelating experience for 32 frames... +[2023-09-14 12:41:54,431][93837] Multi agent env, num agents: 2 +[2023-09-14 12:41:54,437][93987] Initialized w:7 v:1 player:1 +[2023-09-14 12:41:54,438][93987] Initialized w:7 v:1 player:0 +[2023-09-14 12:41:54,439][93987] 2 agent workers initialized for env 7! +[2023-09-14 12:41:54,447][93873] Initializing env for player 0, init_info: {'port': 40701}... +[2023-09-14 12:41:54,449][93987] Decorrelating experience for 32 frames... +[2023-09-14 12:41:54,449][93871] Initialized w:3 v:0 player:1 +[2023-09-14 12:41:54,449][93871] Initialized w:3 v:0 player:0 +[2023-09-14 12:41:54,451][93871] 2 agent workers initialized for env 3! +[2023-09-14 12:41:54,462][93871] Decorrelating experience for 0 frames... +[2023-09-14 12:41:54,463][93871] Port 40601 is available +[2023-09-14 12:41:54,463][93871] Using port 40601 +[2023-09-14 12:41:54,463][93871] Initializing env for player 0, init_info: {'port': 40601}... +[2023-09-14 12:41:54,468][93837] Port 40302 is available +[2023-09-14 12:41:54,469][93837] Using port 40302 +[2023-09-14 12:41:54,469][93837] Initializing env for player 0, init_info: {'port': 40302}... +[2023-09-14 12:41:54,479][93839] Multi agent env, num agents: 2 +[2023-09-14 12:41:54,481][93873] Using port 40701 on host... +[2023-09-14 12:41:54,497][93906] Multi agent env, num agents: 2 +[2023-09-14 12:41:54,498][93873] Initializing env for player 1, init_info: {'port': 40701}... +[2023-09-14 12:41:54,501][93838] Initialized w:1 v:1 player:0 +[2023-09-14 12:41:54,502][93838] Initialized w:1 v:1 player:1 +[2023-09-14 12:41:54,503][93838] 2 agent workers initialized for env 1! +[2023-09-14 12:41:54,505][93837] Using port 40302 on host... +[2023-09-14 12:41:54,509][93871] Using port 40601 on host... +[2023-09-14 12:41:54,513][93838] Decorrelating experience for 32 frames... +[2023-09-14 12:41:54,516][93871] Initializing env for player 1, init_info: {'port': 40601}... +[2023-09-14 12:41:54,520][93837] Initializing env for player 1, init_info: {'port': 40302}... +[2023-09-14 12:41:54,525][93839] Multi agent env, num agents: 2 +[2023-09-14 12:41:54,528][93906] Multi agent env, num agents: 2 +[2023-09-14 12:41:54,535][93987] Multi agent env, num agents: 2 +[2023-09-14 12:41:54,558][93906] Port 40902 is available +[2023-09-14 12:41:54,559][93906] Using port 40902 +[2023-09-14 12:41:54,559][93906] Initializing env for player 0, init_info: {'port': 40902}... +[2023-09-14 12:41:54,570][93839] Port 40502 is available +[2023-09-14 12:41:54,570][93839] Using port 40502 +[2023-09-14 12:41:54,571][93839] Initializing env for player 0, init_info: {'port': 40502}... +[2023-09-14 12:41:54,581][93987] Multi agent env, num agents: 2 +[2023-09-14 12:41:54,594][93838] Multi agent env, num agents: 2 +[2023-09-14 12:41:54,599][93906] Using port 40902 on host... +[2023-09-14 12:41:54,611][93839] Using port 40502 on host... +[2023-09-14 12:41:54,612][93906] Initializing env for player 1, init_info: {'port': 40902}... +[2023-09-14 12:41:54,621][93839] Initializing env for player 1, init_info: {'port': 40502}... +[2023-09-14 12:41:54,628][93838] Multi agent env, num agents: 2 +[2023-09-14 12:41:54,631][93987] UDP port 41002 cannot be used [Errno 98] Address already in use +[2023-09-14 12:41:54,631][93987] Port 42002 is available +[2023-09-14 12:41:54,632][93987] Using port 42002 +[2023-09-14 12:41:54,723][93838] Port 40402 is available +[2023-09-14 12:41:54,723][93838] Using port 40402 +[2023-09-14 12:41:54,724][93838] Initializing env for player 0, init_info: {'port': 40402}... +[2023-09-14 12:41:54,759][93838] Using port 40402 on host... +[2023-09-14 12:41:54,775][93838] Initializing env for player 1, init_info: {'port': 40402}... +[2023-09-14 12:41:55,626][93837] Initialized w:0 v:2 player:1 +[2023-09-14 12:41:55,627][93837] Initialized w:0 v:2 player:0 +[2023-09-14 12:41:55,628][93837] 2 agent workers initialized for env 0! +[2023-09-14 12:41:55,636][93837] Decorrelating experience for 64 frames... +[2023-09-14 12:41:55,667][93873] Initialized w:4 v:1 player:1 +[2023-09-14 12:41:55,668][93873] Initialized w:4 v:1 player:0 +[2023-09-14 12:41:55,669][93873] 2 agent workers initialized for env 4! +[2023-09-14 12:41:55,678][93874] Initializing env for player 0, init_info: {'port': 40801}... +[2023-09-14 12:41:55,679][93873] Decorrelating experience for 32 frames... +[2023-09-14 12:41:55,686][93871] Initialized w:3 v:1 player:1 +[2023-09-14 12:41:55,688][93871] Initialized w:3 v:1 player:0 +[2023-09-14 12:41:55,689][93871] 2 agent workers initialized for env 3! +[2023-09-14 12:41:55,699][93871] Decorrelating experience for 32 frames... +[2023-09-14 12:41:55,712][93874] Using port 40801 on host... +[2023-09-14 12:41:55,728][93874] Initializing env for player 1, init_info: {'port': 40801}... +[2023-09-14 12:41:55,765][93873] Multi agent env, num agents: 2 +[2023-09-14 12:41:55,797][93906] Initialized w:6 v:2 player:1 +[2023-09-14 12:41:55,799][93906] Initialized w:6 v:2 player:0 +[2023-09-14 12:41:55,799][93906] 2 agent workers initialized for env 6! +[2023-09-14 12:41:55,801][93871] Multi agent env, num agents: 2 +[2023-09-14 12:41:55,805][93873] Multi agent env, num agents: 2 +[2023-09-14 12:41:55,809][93837] Port 40303 is available +[2023-09-14 12:41:55,809][93837] Using port 40303 +[2023-09-14 12:41:55,810][93837] Initializing env for player 0, init_info: {'port': 40303}... +[2023-09-14 12:41:55,810][93906] Decorrelating experience for 64 frames... +[2023-09-14 12:41:55,827][93839] Initialized w:2 v:2 player:1 +[2023-09-14 12:41:55,828][93839] Initialized w:2 v:2 player:0 +[2023-09-14 12:41:55,829][93839] 2 agent workers initialized for env 2! +[2023-09-14 12:41:55,838][93839] Decorrelating experience for 64 frames... +[2023-09-14 12:41:55,848][93871] Multi agent env, num agents: 2 +[2023-09-14 12:41:55,851][93873] Port 40702 is available +[2023-09-14 12:41:55,852][93873] Using port 40702 +[2023-09-14 12:41:55,852][93873] Initializing env for player 0, init_info: {'port': 40702}... +[2023-09-14 12:41:55,855][93837] Using port 40303 on host... +[2023-09-14 12:41:55,861][93837] Initializing env for player 1, init_info: {'port': 40303}... +[2023-09-14 12:41:55,894][93871] Port 40602 is available +[2023-09-14 12:41:55,894][93871] Using port 40602 +[2023-09-14 12:41:55,894][93871] Initializing env for player 0, init_info: {'port': 40602}... +[2023-09-14 12:41:55,897][93873] Using port 40702 on host... +[2023-09-14 12:41:55,905][93873] Initializing env for player 1, init_info: {'port': 40702}... +[2023-09-14 12:41:55,930][93838] Initialized w:1 v:2 player:1 +[2023-09-14 12:41:55,932][93838] Initialized w:1 v:2 player:0 +[2023-09-14 12:41:55,933][93838] 2 agent workers initialized for env 1! +[2023-09-14 12:41:55,939][93871] Using port 40602 on host... +[2023-09-14 12:41:55,943][93838] Decorrelating experience for 64 frames... +[2023-09-14 12:41:55,945][93871] Initializing env for player 1, init_info: {'port': 40602}... +[2023-09-14 12:41:55,954][93906] Port 40903 is available +[2023-09-14 12:41:55,954][93906] Using port 40903 +[2023-09-14 12:41:55,955][93906] Initializing env for player 0, init_info: {'port': 40903}... +[2023-09-14 12:41:56,000][93906] Using port 40903 on host... +[2023-09-14 12:41:56,001][93839] Port 40503 is available +[2023-09-14 12:41:56,001][93839] Using port 40503 +[2023-09-14 12:41:56,001][93839] Initializing env for player 0, init_info: {'port': 40503}... +[2023-09-14 12:41:56,008][93906] Initializing env for player 1, init_info: {'port': 40903}... +[2023-09-14 12:41:56,031][93839] Using port 40503 on host... +[2023-09-14 12:41:56,052][93839] Initializing env for player 1, init_info: {'port': 40503}... +[2023-09-14 12:41:56,120][93838] Port 40403 is available +[2023-09-14 12:41:56,120][93838] Using port 40403 +[2023-09-14 12:41:56,800][93874] Initialized w:5 v:1 player:0 +[2023-09-14 12:41:56,801][93874] Initialized w:5 v:1 player:1 +[2023-09-14 12:41:56,803][93874] 2 agent workers initialized for env 5! +[2023-09-14 12:41:56,815][93874] Decorrelating experience for 32 frames... +[2023-09-14 12:41:56,818][93987] Initializing env for player 0, init_info: {'port': 42002}... +[2023-09-14 12:41:56,853][93987] Using port 42002 on host... +[2023-09-14 12:41:56,869][93987] Initializing env for player 1, init_info: {'port': 42002}... +[2023-09-14 12:41:56,885][93874] Multi agent env, num agents: 2 +[2023-09-14 12:41:56,931][93874] Multi agent env, num agents: 2 +[2023-09-14 12:41:56,935][93837] Initialized w:0 v:3 player:0 +[2023-09-14 12:41:56,936][93837] Initialized w:0 v:3 player:1 +[2023-09-14 12:41:56,939][93837] 2 agent workers initialized for env 0! +[2023-09-14 12:41:56,953][93837] Decorrelating experience for 96 frames... +[2023-09-14 12:41:56,972][93871] Initialized w:3 v:2 player:0 +[2023-09-14 12:41:56,974][93873] Initialized w:4 v:2 player:0 +[2023-09-14 12:41:56,974][93873] Initialized w:4 v:2 player:1 +[2023-09-14 12:41:56,974][93871] Initialized w:3 v:2 player:1 +[2023-09-14 12:41:56,975][93871] 2 agent workers initialized for env 3! +[2023-09-14 12:41:56,976][93873] 2 agent workers initialized for env 4! +[2023-09-14 12:41:56,984][93873] Decorrelating experience for 64 frames... +[2023-09-14 12:41:56,991][93871] Decorrelating experience for 64 frames... +[2023-09-14 12:41:56,999][93874] Port 40802 is available +[2023-09-14 12:41:56,999][93874] Using port 40802 +[2023-09-14 12:41:57,000][93874] Initializing env for player 0, init_info: {'port': 40802}... +[2023-09-14 12:41:57,033][93874] Using port 40802 on host... +[2023-09-14 12:41:57,050][93874] Initializing env for player 1, init_info: {'port': 40802}... +[2023-09-14 12:41:57,114][93906] Initialized w:6 v:3 player:0 +[2023-09-14 12:41:57,115][93906] Initialized w:6 v:3 player:1 +[2023-09-14 12:41:57,117][93906] 2 agent workers initialized for env 6! +[2023-09-14 12:41:57,128][93906] Decorrelating experience for 96 frames... +[2023-09-14 12:41:57,147][93873] Port 40703 is available +[2023-09-14 12:41:57,148][93873] Using port 40703 +[2023-09-14 12:41:57,148][93873] Initializing env for player 0, init_info: {'port': 40703}... +[2023-09-14 12:41:57,170][93871] Port 40603 is available +[2023-09-14 12:41:57,170][93871] Using port 40603 +[2023-09-14 12:41:57,183][93873] Using port 40703 on host... +[2023-09-14 12:41:57,189][93839] Initialized w:2 v:3 player:0 +[2023-09-14 12:41:57,189][93839] Initialized w:2 v:3 player:1 +[2023-09-14 12:41:57,191][93839] 2 agent workers initialized for env 2! +[2023-09-14 12:41:57,198][93873] Initializing env for player 1, init_info: {'port': 40703}... +[2023-09-14 12:41:57,199][93839] Decorrelating experience for 96 frames... +[2023-09-14 12:41:57,231][93838] Initializing env for player 0, init_info: {'port': 40403}... +[2023-09-14 12:41:57,277][93838] Using port 40403 on host... +[2023-09-14 12:41:57,281][93838] Initializing env for player 1, init_info: {'port': 40403}... +[2023-09-14 12:41:57,931][109198] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 8851456. Throughput: 0: 0.0, 1: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 12:41:58,026][93987] Initialized w:7 v:2 player:1 +[2023-09-14 12:41:58,027][93987] Initialized w:7 v:2 player:0 +[2023-09-14 12:41:58,030][93987] 2 agent workers initialized for env 7! +[2023-09-14 12:41:58,040][93987] Decorrelating experience for 64 frames... +[2023-09-14 12:41:58,212][93987] Port 41003 is available +[2023-09-14 12:41:58,212][93987] Using port 41003 +[2023-09-14 12:41:58,213][93987] Initializing env for player 0, init_info: {'port': 41003}... +[2023-09-14 12:41:58,215][93873] Initialized w:4 v:3 player:0 +[2023-09-14 12:41:58,215][93873] Initialized w:4 v:3 player:1 +[2023-09-14 12:41:58,217][93873] 2 agent workers initialized for env 4! +[2023-09-14 12:41:58,227][93873] Decorrelating experience for 96 frames... +[2023-09-14 12:41:58,230][93874] Initialized w:5 v:2 player:1 +[2023-09-14 12:41:58,230][93874] Initialized w:5 v:2 player:0 +[2023-09-14 12:41:58,232][93874] 2 agent workers initialized for env 5! +[2023-09-14 12:41:58,244][93874] Decorrelating experience for 64 frames... +[2023-09-14 12:41:58,244][93987] Using port 41003 on host... +[2023-09-14 12:41:58,252][93871] Initializing env for player 0, init_info: {'port': 40603}... +[2023-09-14 12:41:58,263][93987] Initializing env for player 1, init_info: {'port': 41003}... +[2023-09-14 12:41:58,298][93871] Using port 40603 on host... +[2023-09-14 12:41:58,303][93871] Initializing env for player 1, init_info: {'port': 40603}... +[2023-09-14 12:41:58,462][93874] Port 40803 is available +[2023-09-14 12:41:58,462][93874] Using port 40803 +[2023-09-14 12:41:58,463][93874] Initializing env for player 0, init_info: {'port': 40803}... +[2023-09-14 12:41:58,468][93838] Initialized w:1 v:3 player:1 +[2023-09-14 12:41:58,468][93838] Initialized w:1 v:3 player:0 +[2023-09-14 12:41:58,469][93838] 2 agent workers initialized for env 1! +[2023-09-14 12:41:58,480][93838] Decorrelating experience for 96 frames... +[2023-09-14 12:41:58,508][93874] Using port 40803 on host... +[2023-09-14 12:41:58,513][93874] Initializing env for player 1, init_info: {'port': 40803}... +[2023-09-14 12:41:59,430][93987] Initialized w:7 v:3 player:1 +[2023-09-14 12:41:59,432][93987] Initialized w:7 v:3 player:0 +[2023-09-14 12:41:59,432][93987] 2 agent workers initialized for env 7! +[2023-09-14 12:41:59,442][93987] Decorrelating experience for 96 frames... +[2023-09-14 12:41:59,531][93871] Initialized w:3 v:3 player:1 +[2023-09-14 12:41:59,532][93871] Initialized w:3 v:3 player:0 +[2023-09-14 12:41:59,533][93871] 2 agent workers initialized for env 3! +[2023-09-14 12:41:59,543][93871] Decorrelating experience for 96 frames... +[2023-09-14 12:41:59,730][93874] Initialized w:5 v:3 player:1 +[2023-09-14 12:41:59,731][93874] Initialized w:5 v:3 player:0 +[2023-09-14 12:41:59,732][93874] 2 agent workers initialized for env 5! +[2023-09-14 12:41:59,742][93874] Decorrelating experience for 96 frames... +[2023-09-14 12:41:59,950][93585] Signal inference workers to stop experience collection... +[2023-09-14 12:41:59,963][93835] InferenceWorker_p0-w0: stopping experience collection +[2023-09-14 12:41:59,977][93836] InferenceWorker_p1-w0: stopping experience collection +[2023-09-14 12:42:02,412][93585] Signal inference workers to resume experience collection... +[2023-09-14 12:42:02,412][93836] InferenceWorker_p1-w0: resuming experience collection +[2023-09-14 12:42:02,413][93835] InferenceWorker_p0-w0: resuming experience collection +[2023-09-14 12:42:02,931][109198] Fps is (10 sec: 409.6, 60 sec: 409.6, 300 sec: 409.6). Total num frames: 8855552. Throughput: 0: 252.3, 1: 125.5. Samples: 3778. Policy #0 lag: (min: 0.0, avg: 0.0, max: 0.0) +[2023-09-14 12:42:05,363][109198] Heartbeat connected on Batcher_0 +[2023-09-14 12:42:05,366][109198] Heartbeat connected on LearnerWorker_p0 +[2023-09-14 12:42:05,369][109198] Heartbeat connected on Batcher_1 +[2023-09-14 12:42:05,385][109198] Heartbeat connected on InferenceWorker_p0-w0 +[2023-09-14 12:42:05,390][109198] Heartbeat connected on InferenceWorker_p1-w0 +[2023-09-14 12:42:05,400][109198] Heartbeat connected on RolloutWorker_w2 +[2023-09-14 12:42:05,411][109198] Heartbeat connected on RolloutWorker_w3 +[2023-09-14 12:42:05,412][109198] Heartbeat connected on RolloutWorker_w6 +[2023-09-14 12:42:05,413][109198] Heartbeat connected on RolloutWorker_w1 +[2023-09-14 12:42:05,415][109198] Heartbeat connected on RolloutWorker_w0 +[2023-09-14 12:42:05,417][109198] Heartbeat connected on RolloutWorker_w7 +[2023-09-14 12:42:05,418][109198] Heartbeat connected on RolloutWorker_w4 +[2023-09-14 12:42:05,424][109198] Heartbeat connected on RolloutWorker_w5 +[2023-09-14 12:42:05,486][93674] Signal inference workers to stop experience collection... +[2023-09-14 12:42:05,953][93674] Signal inference workers to resume experience collection... +[2023-09-14 12:42:06,386][109198] Heartbeat connected on LearnerWorker_p1 +[2023-09-14 12:42:07,688][93835] Updated weights for policy 0, policy_version 1449 (0.0689) +[2023-09-14 12:42:07,931][109198] Fps is (10 sec: 6144.0, 60 sec: 4096.0, 300 sec: 4096.0). Total num frames: 8912896. Throughput: 0: 641.1, 1: 298.7. Samples: 14096. Policy #0 lag: (min: 0.0, avg: 0.8, max: 3.0) +[2023-09-14 12:42:12,219][93835] Updated weights for policy 0, policy_version 1459 (0.0012) +[2023-09-14 12:42:12,700][93836] Updated weights for policy 1, policy_version 732 (0.0016) +[2023-09-14 12:42:12,931][109198] Fps is (10 sec: 12697.8, 60 sec: 6553.6, 300 sec: 6553.6). Total num frames: 8982528. Throughput: 0: 817.2, 1: 385.8. Samples: 24058. Policy #0 lag: (min: 0.0, avg: 0.9, max: 2.0) +[2023-09-14 12:42:16,467][93835] Updated weights for policy 0, policy_version 1469 (0.0013) +[2023-09-14 12:42:17,931][109198] Fps is (10 sec: 13516.9, 60 sec: 7864.4, 300 sec: 7864.4). Total num frames: 9048064. Throughput: 0: 1212.3, 1: 578.8. Samples: 44778. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:42:20,659][93835] Updated weights for policy 0, policy_version 1479 (0.0011) +[2023-09-14 12:42:21,452][93836] Updated weights for policy 1, policy_version 742 (0.0013) +[2023-09-14 12:42:22,931][109198] Fps is (10 sec: 13926.5, 60 sec: 9011.3, 300 sec: 9011.3). Total num frames: 9121792. Throughput: 0: 1499.1, 1: 711.3. Samples: 66312. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:42:24,815][93835] Updated weights for policy 0, policy_version 1489 (0.0014) +[2023-09-14 12:42:27,931][109198] Fps is (10 sec: 13926.0, 60 sec: 9596.3, 300 sec: 9596.3). Total num frames: 9187328. Throughput: 0: 1495.2, 1: 709.7. Samples: 77173. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:42:29,632][93835] Updated weights for policy 0, policy_version 1499 (0.0014) +[2023-09-14 12:42:31,117][93836] Updated weights for policy 1, policy_version 752 (0.0013) +[2023-09-14 12:42:32,931][109198] Fps is (10 sec: 13107.1, 60 sec: 10035.2, 300 sec: 10035.2). Total num frames: 9252864. Throughput: 0: 1631.7, 1: 774.1. Samples: 96231. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:42:34,332][93835] Updated weights for policy 0, policy_version 1509 (0.0017) +[2023-09-14 12:42:36,849][93906] DAMAGECOUNT value on done: 100.0 +[2023-09-14 12:42:36,849][93906] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:42:36,850][93906] Sum rewards: 4.498, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.011', 'AMMO3': '0.052', 'AMMO4': '0.057', 'WEAPON4': '0.100', 'weapon4': '0.118', 'WEAPON5': '0.200', 'weapon2': '0.378', 'WEAPON3': '0.400', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon3': '1.582', 'weapon5': '1.592'} +[2023-09-14 12:42:37,050][93906] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:42:37,460][93906] DAMAGECOUNT value on done: 266.0 +[2023-09-14 12:42:37,460][93906] DAMAGECOUNT value on done: 95.0 +[2023-09-14 12:42:37,461][93906] Sum rewards: 5.313, reward structure: {'HEALTH': '-1.950', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.008', 'AMMO4': '0.022', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.506', 'weapon5': '0.906', 'FRAGCOUNT': '1.000', 'weapon3': '2.516', 'DAMAGECOUNT': '2.660'} +[2023-09-14 12:42:37,461][93906] Sum rewards: -0.428, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.013', 'AMMO5': '0.020', 'weapon5': '0.042', 'AMMO4': '0.064', 'weapon4': '0.072', 'AMMO3': '0.110', 'WEAPON4': '0.200', 'WEAPON5': '0.400', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.950', 'weapon2': '1.308', 'weapon3': '1.694'} +[2023-09-14 12:42:37,931][109198] Fps is (10 sec: 12698.0, 60 sec: 10285.5, 300 sec: 10285.5). Total num frames: 9314304. Throughput: 0: 1731.5, 1: 823.1. Samples: 114955. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:42:37,932][109198] Avg episode reward: [(0, '2.348')] +[2023-09-14 12:42:39,001][93873] DAMAGECOUNT value on done: 85.0 +[2023-09-14 12:42:39,002][93873] DAMAGECOUNT value on done: 65.0 +[2023-09-14 12:42:39,332][93835] Updated weights for policy 0, policy_version 1519 (0.0014) +[2023-09-14 12:42:39,679][93873] DAMAGECOUNT value on done: 200.0 +[2023-09-14 12:42:39,679][93873] DAMAGECOUNT value on done: 305.0 +[2023-09-14 12:42:39,680][93873] Sum rewards: 3.145, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'weapon5': '0.042', 'AMMO2': '0.045', 'AMMO3': '0.098', 'AMMO4': '0.227', 'weapon2': '0.268', 'WEAPON4': '0.400', 'WEAPON5': '0.400', 'weapon4': '0.612', 'WEAPON3': '0.700', 'DAMAGECOUNT': '2.000', 'FRAGCOUNT': '2.000', 'weapon3': '2.332'} +[2023-09-14 12:42:39,680][93873] Sum rewards: 6.826, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.020', 'AMMO2': '-0.004', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO3': '0.070', 'WEAPON4': '0.100', 'weapon4': '0.190', 'WEAPON5': '0.300', 'weapon2': '0.414', 'WEAPON3': '0.600', 'weapon5': '0.688', 'weapon3': '2.422', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.050'} +[2023-09-14 12:42:40,001][93838] DAMAGECOUNT value on done: 220.0 +[2023-09-14 12:42:40,002][93838] DAMAGECOUNT value on done: 120.0 +[2023-09-14 12:42:40,002][93838] Sum rewards: 5.863, reward structure: {'HEALTH': '-1.700', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.010', 'AMMO3': '0.041', 'AMMO4': '0.052', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.230', 'WEAPON3': '0.400', 'weapon4': '0.458', 'weapon5': '0.548', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.200', 'weapon3': '2.216'} +[2023-09-14 12:42:40,008][93839] DAMAGECOUNT value on done: 290.0 +[2023-09-14 12:42:40,008][93839] DAMAGECOUNT value on done: 260.0 +[2023-09-14 12:42:40,009][93839] Sum rewards: 6.109, reward structure: {'HEALTH': '-2.500', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.015', 'AMMO4': '0.025', 'AMMO3': '0.069', 'weapon5': '0.092', 'WEAPON4': '0.200', 'weapon2': '0.296', 'WEAPON5': '0.300', 'weapon4': '0.314', 'WEAPON3': '0.600', 'weapon3': '2.792', 'DAMAGECOUNT': '2.900', 'FRAGCOUNT': '3.000'} +[2023-09-14 12:42:40,010][93839] Sum rewards: 3.465, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.021', 'AMMO3': '0.093', 'AMMO4': '0.104', 'weapon2': '0.218', 'weapon5': '0.220', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon4': '0.490', 'WEAPON3': '0.700', 'FRAGCOUNT': '2.000', 'weapon3': '2.404', 'DAMAGECOUNT': '2.600'} +[2023-09-14 12:42:40,223][93839] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:42:40,482][93873] DAMAGECOUNT value on done: 20.0 +[2023-09-14 12:42:40,482][93873] DAMAGECOUNT value on done: 65.0 +[2023-09-14 12:42:40,519][93906] DAMAGECOUNT value on done: 30.0 +[2023-09-14 12:42:40,519][93906] DAMAGECOUNT value on done: 20.0 +[2023-09-14 12:42:40,600][93838] DAMAGECOUNT value on done: 210.0 +[2023-09-14 12:42:40,600][93838] DAMAGECOUNT value on done: 210.0 +[2023-09-14 12:42:40,602][93838] Sum rewards: 5.161, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.018', 'AMMO3': '0.081', 'AMMO4': '0.089', 'weapon2': '0.142', 'WEAPON4': '0.200', 'weapon4': '0.272', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon5': '1.076', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.100', 'weapon3': '2.268'} +[2023-09-14 12:42:40,602][93838] Sum rewards: 4.536, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.012', 'AMMO3': '0.045', 'AMMO4': '0.060', 'weapon4': '0.098', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.490', 'weapon5': '1.012', 'weapon3': '1.908', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.100'} +[2023-09-14 12:42:40,628][93839] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:42:40,629][93839] DAMAGECOUNT value on done: 60.0 +[2023-09-14 12:42:40,802][93836] Updated weights for policy 1, policy_version 762 (0.0013) +[2023-09-14 12:42:41,204][93873] DAMAGECOUNT value on done: 130.0 +[2023-09-14 12:42:41,204][93873] Sum rewards: 5.935, reward structure: {'HEALTH': '-0.750', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.025', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO4': '0.125', 'WEAPON3': '0.200', 'weapon2': '0.454', 'weapon4': '0.598', 'weapon3': '0.806', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.300', 'weapon5': '1.952'} +[2023-09-14 12:42:41,205][93873] DAMAGECOUNT value on done: 75.0 +[2023-09-14 12:42:41,292][93906] DAMAGECOUNT value on done: 200.0 +[2023-09-14 12:42:41,292][93906] DAMAGECOUNT value on done: 165.0 +[2023-09-14 12:42:41,293][93906] Sum rewards: 5.203, reward structure: {'HEALTH': '-1.840', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.046', 'weapon4': '0.096', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.622', 'weapon5': '0.652', 'weapon3': '1.920', 'DAMAGECOUNT': '2.000', 'FRAGCOUNT': '2.000'} +[2023-09-14 12:42:41,293][93906] Sum rewards: 2.191, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.025', 'AMMO3': '0.070', 'WEAPON5': '0.100', 'weapon5': '0.114', 'AMMO4': '0.122', 'WEAPON4': '0.200', 'weapon2': '0.412', 'WEAPON3': '0.500', 'weapon4': '0.822', 'FRAGCOUNT': '1.000', 'weapon3': '1.170', 'DAMAGECOUNT': '1.650'} +[2023-09-14 12:42:41,318][93839] DAMAGECOUNT value on done: 14.0 +[2023-09-14 12:42:41,318][93839] DAMAGECOUNT value on done: 30.0 +[2023-09-14 12:42:41,356][93874] DAMAGECOUNT value on done: 75.0 +[2023-09-14 12:42:41,357][93874] DAMAGECOUNT value on done: 20.0 +[2023-09-14 12:42:41,491][93873] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:42:42,016][93839] DAMAGECOUNT value on done: 199.0 +[2023-09-14 12:42:42,016][93839] DAMAGECOUNT value on done: 77.0 +[2023-09-14 12:42:42,017][93839] Sum rewards: 5.961, reward structure: {'HEALTH': '-0.770', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.712', 'FRAGCOUNT': '1.000', 'weapon3': '1.150', 'weapon5': '1.554', 'DAMAGECOUNT': '1.990'} +[2023-09-14 12:42:42,110][93874] DAMAGECOUNT value on done: 75.0 +[2023-09-14 12:42:42,110][93874] DAMAGECOUNT value on done: 60.0 +[2023-09-14 12:42:42,133][93871] DAMAGECOUNT value on done: 124.0 +[2023-09-14 12:42:42,134][93871] Sum rewards: 3.787, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.007', 'AMMO4': '0.024', 'AMMO3': '0.051', 'weapon2': '0.092', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.368', 'WEAPON3': '0.400', 'weapon5': '0.746', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.240', 'weapon3': '1.654'} +[2023-09-14 12:42:42,133][93871] DAMAGECOUNT value on done: 130.0 +[2023-09-14 12:42:42,135][93871] Sum rewards: 4.331, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.032', 'AMMO3': '0.050', 'AMMO4': '0.159', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.282', 'weapon5': '0.286', 'WEAPON3': '0.400', 'weapon4': '0.646', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.300', 'weapon3': '1.766'} +[2023-09-14 12:42:42,407][93871] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:42:42,802][93871] DAMAGECOUNT value on done: 100.0 +[2023-09-14 12:42:42,803][93871] DAMAGECOUNT value on done: 110.0 +[2023-09-14 12:42:42,803][93871] Sum rewards: 2.779, reward structure: {'HEALTH': '-1.550', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.050', 'weapon2': '0.094', 'WEAPON5': '0.100', 'weapon5': '0.182', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.596', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon3': '1.654'} +[2023-09-14 12:42:42,831][93874] DAMAGECOUNT value on done: 275.0 +[2023-09-14 12:42:42,831][93874] DAMAGECOUNT value on done: 185.0 +[2023-09-14 12:42:42,832][93874] Sum rewards: 5.448, reward structure: {'HEALTH': '-2.200', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.010', 'AMMO5': '0.015', 'AMMO4': '0.051', 'AMMO3': '0.069', 'weapon5': '0.082', 'weapon2': '0.114', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon4': '0.472', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.750', 'weapon3': '2.886'} +[2023-09-14 12:42:42,833][93874] Sum rewards: 2.386, reward structure: {'HEALTH': '-2.700', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.025', 'weapon5': '0.036', 'AMMO3': '0.086', 'AMMO4': '0.122', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon2': '0.300', 'weapon4': '0.384', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.850', 'weapon3': '2.068'} +[2023-09-14 12:42:42,931][109198] Fps is (10 sec: 12697.6, 60 sec: 10567.7, 300 sec: 10567.7). Total num frames: 9379840. Throughput: 0: 1865.3, 1: 895.7. Samples: 124246. Policy #0 lag: (min: 0.0, avg: 0.9, max: 2.0) +[2023-09-14 12:42:42,933][109198] Avg episode reward: [(0, '3.641'), (1, '2.921')] +[2023-09-14 12:42:42,937][93674] Saving new best policy, reward=2.921! +[2023-09-14 12:42:43,017][93874] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:42:43,324][93871] DAMAGECOUNT value on done: 76.0 +[2023-09-14 12:42:43,325][93871] DAMAGECOUNT value on done: 212.0 +[2023-09-14 12:42:43,325][93871] Sum rewards: 5.000, reward structure: {'HEALTH': '-0.760', 'HITCOUNT': '0.000', 'AMMO2': '0.010', 'AMMO3': '0.020', 'AMMO4': '0.050', 'WEAPON4': '0.100', 'weapon2': '0.112', 'WEAPON3': '0.200', 'weapon4': '0.388', 'weapon3': '0.760', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.120'} +[2023-09-14 12:42:43,380][93874] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:42:43,380][93874] DAMAGECOUNT value on done: 60.0 +[2023-09-14 12:42:43,381][93874] Sum rewards: 1.771, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.027', 'AMMO2': '-0.005', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.010', 'AMMO3': '0.046', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.460', 'weapon5': '1.066', 'weapon3': '1.722'} +[2023-09-14 12:42:43,546][93838] DAMAGECOUNT value on done: 75.0 +[2023-09-14 12:42:43,546][93838] DAMAGECOUNT value on done: 20.0 +[2023-09-14 12:42:43,608][93837] DAMAGECOUNT value on done: 201.0 +[2023-09-14 12:42:43,609][93837] DAMAGECOUNT value on done: 10.0 +[2023-09-14 12:42:43,609][93837] Sum rewards: 5.045, reward structure: {'HEALTH': '-0.100', 'HITCOUNT': '0.000', 'AMMO3': '0.020', 'AMMO2': '0.030', 'WEAPON4': '0.100', 'AMMO4': '0.149', 'WEAPON3': '0.200', 'weapon2': '0.204', 'weapon3': '0.678', 'weapon4': '0.754', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '2.010'} +[2023-09-14 12:42:43,780][93838] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:42:43,925][93871] DAMAGECOUNT value on done: 20.0 +[2023-09-14 12:42:43,926][93871] DAMAGECOUNT value on done: 30.0 +[2023-09-14 12:42:43,978][93837] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:42:44,138][93838] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:42:44,138][93838] Sum rewards: 0.817, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.013', 'AMMO2': '0.021', 'AMMO3': '0.070', 'weapon5': '0.088', 'AMMO4': '0.104', 'weapon4': '0.140', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon2': '0.456', 'WEAPON3': '0.600', 'weapon3': '2.826'} +[2023-09-14 12:42:44,138][93838] DAMAGECOUNT value on done: 115.0 +[2023-09-14 12:42:44,139][93838] Sum rewards: 4.191, reward structure: {'HITCOUNT': '0.000', 'AMMO2': '0.020', 'AMMO3': '0.020', 'AMMO4': '0.099', 'WEAPON4': '0.100', 'weapon2': '0.194', 'WEAPON3': '0.200', 'weapon4': '0.588', 'weapon3': '0.820', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150'} +[2023-09-14 12:42:44,209][93835] Updated weights for policy 0, policy_version 1529 (0.0013) +[2023-09-14 12:42:44,264][93987] DAMAGECOUNT value on done: 75.0 +[2023-09-14 12:42:44,265][93987] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:42:44,503][93837] DAMAGECOUNT value on done: 30.0 +[2023-09-14 12:42:44,504][93837] DAMAGECOUNT value on done: 30.0 +[2023-09-14 12:42:44,504][93837] Sum rewards: 2.521, reward structure: {'HEALTH': '-1.300', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.032', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.300', 'weapon2': '0.378', 'weapon3': '1.632', 'weapon5': '2.000'} +[2023-09-14 12:42:44,522][93987] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:42:44,973][93987] DAMAGECOUNT value on done: 245.0 +[2023-09-14 12:42:44,973][93987] DAMAGECOUNT value on done: 290.0 +[2023-09-14 12:42:44,974][93987] Sum rewards: 4.662, reward structure: {'HEALTH': '-2.900', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.033', 'AMMO3': '0.072', 'weapon2': '0.104', 'weapon5': '0.126', 'AMMO4': '0.167', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon4': '0.584', 'WEAPON3': '0.600', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.450', 'weapon3': '2.810'} +[2023-09-14 12:42:44,974][93987] Sum rewards: 5.567, reward structure: {'HEALTH': '-2.400', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.007', 'AMMO5': '0.015', 'AMMO4': '0.036', 'AMMO3': '0.065', 'WEAPON4': '0.200', 'weapon2': '0.262', 'weapon4': '0.262', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.900', 'weapon3': '3.320'} +[2023-09-14 12:42:45,097][93837] DAMAGECOUNT value on done: 220.0 +[2023-09-14 12:42:45,097][93837] Sum rewards: 5.739, reward structure: {'HEALTH': '-1.950', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.029', 'AMMO3': '0.040', 'AMMO4': '0.143', 'weapon2': '0.170', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.872', 'weapon5': '0.918', 'weapon3': '1.506', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.200'} +[2023-09-14 12:42:45,097][93837] DAMAGECOUNT value on done: 200.0 +[2023-09-14 12:42:45,098][93837] Sum rewards: 3.190, reward structure: {'HEALTH': '-2.150', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO4': '0.048', 'AMMO3': '0.064', 'WEAPON5': '0.100', 'weapon2': '0.220', 'weapon5': '0.226', 'WEAPON4': '0.300', 'weapon4': '0.586', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '2.000', 'weapon3': '2.180'} +[2023-09-14 12:42:45,655][93987] DAMAGECOUNT value on done: 10.0 +[2023-09-14 12:42:45,655][93987] DAMAGECOUNT value on done: 85.0 +[2023-09-14 12:42:45,837][93837] DAMAGECOUNT value on done: 310.0 +[2023-09-14 12:42:45,837][93837] DAMAGECOUNT value on done: 180.0 +[2023-09-14 12:42:45,838][93837] Sum rewards: 1.975, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.032', 'weapon2': '0.036', 'AMMO3': '0.070', 'AMMO4': '0.158', 'weapon5': '0.176', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon4': '0.460', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.800', 'weapon3': '3.028'} +[2023-09-14 12:42:45,837][93837] Sum rewards: 7.487, reward structure: {'HEALTH': '-1.800', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.014', 'AMMO3': '0.040', 'AMMO4': '0.069', 'weapon5': '0.152', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.412', 'weapon4': '0.532', 'weapon3': '2.158', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.100'} +[2023-09-14 12:42:46,295][93987] DAMAGECOUNT value on done: 327.0 +[2023-09-14 12:42:46,296][93987] DAMAGECOUNT value on done: 300.0 +[2023-09-14 12:42:46,296][93987] Sum rewards: 5.394, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.012', 'AMMO2': '0.030', 'AMMO3': '0.095', 'AMMO4': '0.148', 'weapon2': '0.176', 'weapon5': '0.188', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon4': '0.420', 'WEAPON3': '0.700', 'weapon3': '2.754', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.270'} +[2023-09-14 12:42:46,297][93987] Sum rewards: 5.377, reward structure: {'HEALTH': '-3.120', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.028', 'weapon2': '0.086', 'AMMO3': '0.109', 'AMMO4': '0.138', 'WEAPON4': '0.300', 'weapon5': '0.328', 'WEAPON5': '0.400', 'weapon4': '0.530', 'WEAPON3': '0.800', 'weapon3': '2.758', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.000'} +[2023-09-14 12:42:47,931][109198] Fps is (10 sec: 13107.3, 60 sec: 10798.6, 300 sec: 10798.6). Total num frames: 9445376. Throughput: 0: 2081.4, 1: 1023.3. Samples: 143487. Policy #0 lag: (min: 0.0, avg: 0.8, max: 3.0) +[2023-09-14 12:42:47,932][109198] Avg episode reward: [(0, '3.595'), (1, '3.076')] +[2023-09-14 12:42:47,934][93674] Saving new best policy, reward=3.076! +[2023-09-14 12:42:49,141][93836] Updated weights for policy 1, policy_version 772 (0.0013) +[2023-09-14 12:42:49,288][93835] Updated weights for policy 0, policy_version 1539 (0.0013) +[2023-09-14 12:42:52,931][109198] Fps is (10 sec: 13926.5, 60 sec: 11127.5, 300 sec: 11127.5). Total num frames: 9519104. Throughput: 0: 2204.6, 1: 1126.2. Samples: 163983. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:42:52,932][109198] Avg episode reward: [(0, '3.595'), (1, '3.076')] +[2023-09-14 12:42:53,866][93835] Updated weights for policy 0, policy_version 1549 (0.0014) +[2023-09-14 12:42:56,488][93836] Updated weights for policy 1, policy_version 782 (0.0012) +[2023-09-14 12:42:57,931][109198] Fps is (10 sec: 13926.4, 60 sec: 12219.8, 300 sec: 11279.8). Total num frames: 9584640. Throughput: 0: 2203.5, 1: 1146.3. Samples: 174796. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:42:57,933][109198] Avg episode reward: [(0, '3.595'), (1, '3.076')] +[2023-09-14 12:42:58,671][93835] Updated weights for policy 0, policy_version 1559 (0.0014) +[2023-09-14 12:43:00,362][93839] Large shaping reward 2.811 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 2.0), ('DAMAGECOUNT', 1.81, 181.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 12:43:02,931][109198] Fps is (10 sec: 13107.1, 60 sec: 13243.8, 300 sec: 11410.3). Total num frames: 9650176. Throughput: 0: 2169.8, 1: 1169.7. Samples: 195057. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:43:02,933][109198] Avg episode reward: [(0, '3.595'), (1, '3.076')] +[2023-09-14 12:43:03,793][93835] Updated weights for policy 0, policy_version 1569 (0.0013) +[2023-09-14 12:43:04,616][93836] Updated weights for policy 1, policy_version 792 (0.0012) +[2023-09-14 12:43:07,931][109198] Fps is (10 sec: 13516.7, 60 sec: 13448.5, 300 sec: 11578.0). Total num frames: 9719808. Throughput: 0: 2121.4, 1: 1192.4. Samples: 215432. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:43:07,933][109198] Avg episode reward: [(0, '3.595'), (1, '3.076')] +[2023-09-14 12:43:08,533][93835] Updated weights for policy 0, policy_version 1579 (0.0014) +[2023-09-14 12:43:12,144][93836] Updated weights for policy 1, policy_version 802 (0.0013) +[2023-09-14 12:43:12,939][109198] Fps is (10 sec: 14324.2, 60 sec: 13514.9, 300 sec: 11774.8). Total num frames: 9793536. Throughput: 0: 2095.0, 1: 1200.4. Samples: 225494. Policy #0 lag: (min: 0.0, avg: 0.6, max: 3.0) +[2023-09-14 12:43:12,942][109198] Avg episode reward: [(0, '3.595'), (1, '3.076')] +[2023-09-14 12:43:13,204][93835] Updated weights for policy 0, policy_version 1589 (0.0015) +[2023-09-14 12:43:16,070][93873] DAMAGECOUNT value on done: 305.0 +[2023-09-14 12:43:16,070][93873] DAMAGECOUNT value on done: 390.0 +[2023-09-14 12:43:16,071][93873] Sum rewards: 3.341, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.037', 'AMMO3': '0.089', 'AMMO4': '0.182', 'weapon5': '0.210', 'weapon2': '0.258', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon4': '0.576', 'WEAPON3': '0.700', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.200', 'weapon3': '2.474'} +[2023-09-14 12:43:16,071][93873] Sum rewards: 7.314, reward structure: {'HEALTH': '-2.050', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.024', 'AMMO3': '0.064', 'weapon2': '0.082', 'AMMO4': '0.118', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.342', 'weapon5': '0.374', 'WEAPON3': '0.600', 'weapon3': '2.994', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.250'} +[2023-09-14 12:43:16,595][93873] DAMAGECOUNT value on done: 322.0 +[2023-09-14 12:43:16,595][93873] DAMAGECOUNT value on done: 395.0 +[2023-09-14 12:43:16,596][93873] Sum rewards: 3.370, reward structure: {'HEALTH': '-1.750', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO4': '0.001', 'AMMO5': '0.008', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'weapon4': '0.112', 'WEAPON5': '0.200', 'weapon2': '0.388', 'WEAPON3': '0.400', 'weapon5': '0.666', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.220', 'weapon3': '1.986'} +[2023-09-14 12:43:16,596][93873] Sum rewards: 1.648, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.008', 'AMMO4': '0.020', 'weapon2': '0.036', 'AMMO3': '0.056', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.366', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.900', 'weapon5': '1.228', 'weapon3': '2.130'} +[2023-09-14 12:43:16,835][93906] DAMAGECOUNT value on done: 160.0 +[2023-09-14 12:43:16,836][93906] DAMAGECOUNT value on done: 40.0 +[2023-09-14 12:43:16,836][93906] Sum rewards: 2.720, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.400', 'weapon2': '0.776', 'weapon5': '1.158', 'weapon3': '1.848'} +[2023-09-14 12:43:17,212][93838] DAMAGECOUNT value on done: 400.0 +[2023-09-14 12:43:17,212][93838] DAMAGECOUNT value on done: 540.0 +[2023-09-14 12:43:17,213][93838] Sum rewards: 3.924, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.015', 'AMMO4': '0.021', 'AMMO3': '0.083', 'WEAPON4': '0.200', 'weapon4': '0.274', 'WEAPON5': '0.300', 'weapon2': '0.346', 'weapon5': '0.634', 'WEAPON3': '0.700', 'FRAGCOUNT': '2.000', 'weapon3': '2.546', 'DAMAGECOUNT': '2.800'} +[2023-09-14 12:43:17,213][93838] Sum rewards: 6.094, reward structure: {'HEALTH': '-2.800', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO4': '0.001', 'AMMO5': '0.015', 'AMMO3': '0.071', 'WEAPON5': '0.300', 'weapon5': '0.448', 'WEAPON3': '0.600', 'weapon2': '0.886', 'weapon3': '2.372', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.200'} +[2023-09-14 12:43:17,584][93906] DAMAGECOUNT value on done: 272.0 +[2023-09-14 12:43:17,586][93906] DAMAGECOUNT value on done: 381.0 +[2023-09-14 12:43:17,587][93906] Sum rewards: 4.282, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.028', 'AMMO3': '0.049', 'weapon2': '0.106', 'AMMO4': '0.138', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.582', 'weapon4': '0.868', 'FRAGCOUNT': '1.000', 'weapon3': '1.080', 'DAMAGECOUNT': '1.770'} +[2023-09-14 12:43:17,590][93906] Sum rewards: 4.088, reward structure: {'HEALTH': '-1.750', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.010', 'AMMO4': '0.021', 'weapon4': '0.034', 'AMMO3': '0.042', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon2': '0.396', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150', 'weapon5': '1.640', 'weapon3': '1.840'} +[2023-09-14 12:43:17,896][93838] DAMAGECOUNT value on done: 485.0 +[2023-09-14 12:43:17,896][93838] DAMAGECOUNT value on done: 560.0 +[2023-09-14 12:43:17,896][93838] Sum rewards: 3.491, reward structure: {'HEALTH': '-3.450', 'DEATHCOUNT': '-3.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'weapon2': '0.010', 'AMMO5': '0.020', 'AMMO3': '0.087', 'WEAPON4': '0.200', 'WEAPON5': '0.400', 'weapon4': '0.430', 'WEAPON3': '0.700', 'weapon5': '0.810', 'FRAGCOUNT': '2.000', 'weapon3': '2.534', 'DAMAGECOUNT': '2.750'} +[2023-09-14 12:43:17,897][93838] Sum rewards: 6.882, reward structure: {'HEALTH': '-2.650', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.009', 'AMMO5': '0.015', 'AMMO4': '0.047', 'AMMO3': '0.078', 'WEAPON4': '0.100', 'weapon2': '0.114', 'weapon4': '0.242', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon5': '1.438', 'weapon3': '2.088', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.500'} +[2023-09-14 12:43:17,931][109198] Fps is (10 sec: 13926.6, 60 sec: 13516.8, 300 sec: 11854.3). Total num frames: 9859072. Throughput: 0: 2094.3, 1: 1245.1. Samples: 246504. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:43:17,932][109198] Avg episode reward: [(0, '3.726'), (1, '3.097')] +[2023-09-14 12:43:17,934][93674] Saving new best policy, reward=3.097! +[2023-09-14 12:43:18,170][93835] Updated weights for policy 0, policy_version 1599 (0.0013) +[2023-09-14 12:43:19,520][93836] Updated weights for policy 1, policy_version 812 (0.0012) +[2023-09-14 12:43:19,532][93874] DAMAGECOUNT value on done: 315.0 +[2023-09-14 12:43:19,532][93874] DAMAGECOUNT value on done: 145.0 +[2023-09-14 12:43:19,532][93874] Sum rewards: 6.490, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.001', 'AMMO4': '0.004', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.724', 'FRAGCOUNT': '1.000', 'weapon5': '1.152', 'weapon3': '2.010', 'DAMAGECOUNT': '2.950'} +[2023-09-14 12:43:19,756][93839] DAMAGECOUNT value on done: 280.0 +[2023-09-14 12:43:19,756][93839] DAMAGECOUNT value on done: 481.0 +[2023-09-14 12:43:19,757][93839] Sum rewards: 5.497, reward structure: {'HEALTH': '-0.200', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon5': '0.492', 'weapon3': '0.866', 'FRAGCOUNT': '1.000', 'weapon2': '1.076', 'DAMAGECOUNT': '1.910'} +[2023-09-14 12:43:19,923][93873] DAMAGECOUNT value on done: 125.0 +[2023-09-14 12:43:19,924][93873] DAMAGECOUNT value on done: 170.0 +[2023-09-14 12:43:19,924][93873] Sum rewards: 2.701, reward structure: {'HEALTH': '-2.050', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.006', 'AMMO2': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO3': '0.062', 'WEAPON4': '0.100', 'weapon4': '0.188', 'WEAPON5': '0.300', 'weapon2': '0.342', 'weapon5': '0.360', 'WEAPON3': '0.600', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '2.742'} +[2023-09-14 12:43:19,925][93873] Sum rewards: 3.962, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.037', 'AMMO3': '0.039', 'weapon2': '0.098', 'WEAPON5': '0.100', 'AMMO4': '0.186', 'WEAPON4': '0.200', 'weapon5': '0.328', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon4': '1.044', 'DAMAGECOUNT': '1.050', 'weapon3': '1.474'} +[2023-09-14 12:43:20,164][93874] DAMAGECOUNT value on done: 225.0 +[2023-09-14 12:43:20,164][93874] DAMAGECOUNT value on done: 275.0 +[2023-09-14 12:43:20,164][93874] Sum rewards: 3.490, reward structure: {'HEALTH': '-2.050', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.008', 'AMMO5': '0.015', 'AMMO4': '0.040', 'AMMO3': '0.065', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon2': '0.356', 'weapon4': '0.366', 'weapon5': '0.564', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.500', 'weapon3': '2.526'} +[2023-09-14 12:43:20,165][93874] Sum rewards: 6.146, reward structure: {'HEALTH': '-1.640', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.013', 'AMMO3': '0.049', 'AMMO4': '0.062', 'WEAPON4': '0.100', 'weapon4': '0.162', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.722', 'weapon5': '1.288', 'weapon3': '1.632', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.150'} +[2023-09-14 12:43:20,347][93839] DAMAGECOUNT value on done: 210.0 +[2023-09-14 12:43:20,347][93839] Sum rewards: 3.102, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.036', 'AMMO3': '0.078', 'AMMO4': '0.181', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon5': '0.356', 'weapon2': '0.490', 'WEAPON3': '0.600', 'weapon4': '0.826', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.500', 'weapon3': '1.524'} +[2023-09-14 12:43:20,347][93839] DAMAGECOUNT value on done: 210.0 +[2023-09-14 12:43:20,348][93839] Sum rewards: 6.092, reward structure: {'HEALTH': '-1.450', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.010', 'AMMO4': '0.018', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.240', 'WEAPON3': '0.400', 'weapon2': '0.436', 'weapon5': '0.970', 'FRAGCOUNT': '2.000', 'weapon3': '2.024', 'DAMAGECOUNT': '2.100'} +[2023-09-14 12:43:20,496][93873] DAMAGECOUNT value on done: 90.0 +[2023-09-14 12:43:20,496][93873] DAMAGECOUNT value on done: 185.0 +[2023-09-14 12:43:20,497][93873] Sum rewards: 2.751, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.043', 'AMMO2': '-0.009', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'DAMAGECOUNT': '0.150', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.640', 'weapon5': '1.310', 'weapon3': '2.054'} +[2023-09-14 12:43:20,511][93906] DAMAGECOUNT value on done: 450.0 +[2023-09-14 12:43:20,512][93906] DAMAGECOUNT value on done: 190.0 +[2023-09-14 12:43:20,512][93906] Sum rewards: 9.360, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.027', 'AMMO3': '0.072', 'AMMO4': '0.133', 'weapon5': '0.296', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon4': '0.330', 'WEAPON3': '0.600', 'weapon2': '0.678', 'weapon3': '2.410', 'FRAGCOUNT': '3.999', 'DAMAGECOUNT': '4.200'} +[2023-09-14 12:43:20,513][93906] Sum rewards: 0.238, reward structure: {'HEALTH': '-4.000', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'weapon5': '0.032', 'AMMO2': '0.045', 'AMMO3': '0.105', 'AMMO4': '0.224', 'WEAPON4': '0.300', 'weapon2': '0.314', 'weapon4': '0.348', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.700', 'weapon3': '2.950'} +[2023-09-14 12:43:20,931][93839] DAMAGECOUNT value on done: 55.0 +[2023-09-14 12:43:20,932][93839] Sum rewards: 2.321, reward structure: {'HEALTH': '-1.300', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.250', 'WEAPON3': '0.400', 'weapon2': '0.788', 'weapon5': '1.128', 'weapon3': '1.866'} +[2023-09-14 12:43:20,932][93839] DAMAGECOUNT value on done: 64.0 +[2023-09-14 12:43:21,152][93906] DAMAGECOUNT value on done: 215.0 +[2023-09-14 12:43:21,152][93906] DAMAGECOUNT value on done: 365.0 +[2023-09-14 12:43:21,153][93906] Sum rewards: 7.991, reward structure: {'HEALTH': '-0.150', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.682', 'weapon3': '1.010', 'DAMAGECOUNT': '2.000', 'FRAGCOUNT': '2.000', 'weapon5': '2.154'} +[2023-09-14 12:43:21,248][93871] DAMAGECOUNT value on done: 124.0 +[2023-09-14 12:43:21,249][93871] DAMAGECOUNT value on done: 140.0 +[2023-09-14 12:43:21,675][93839] DAMAGECOUNT value on done: 284.0 +[2023-09-14 12:43:21,676][93839] DAMAGECOUNT value on done: 172.0 +[2023-09-14 12:43:21,896][93871] DAMAGECOUNT value on done: 352.0 +[2023-09-14 12:43:21,896][93871] DAMAGECOUNT value on done: 320.0 +[2023-09-14 12:43:21,897][93871] Sum rewards: 4.140, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO4': '0.025', 'AMMO3': '0.057', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon2': '0.364', 'weapon4': '0.414', 'WEAPON3': '0.500', 'weapon5': '0.648', 'weapon3': '1.402', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.420'} +[2023-09-14 12:43:21,897][93871] Sum rewards: 4.437, reward structure: {'HEALTH': '-2.420', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'weapon5': '0.022', 'AMMO2': '0.032', 'AMMO3': '0.052', 'WEAPON5': '0.100', 'AMMO4': '0.161', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'weapon2': '0.628', 'weapon4': '1.084', 'weapon3': '1.772', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.200'} +[2023-09-14 12:43:22,335][93837] DAMAGECOUNT value on done: 257.0 +[2023-09-14 12:43:22,335][93837] DAMAGECOUNT value on done: 90.0 +[2023-09-14 12:43:22,336][93837] Sum rewards: 4.450, reward structure: {'HEALTH': '-1.160', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.014', 'AMMO3': '0.043', 'AMMO4': '0.068', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.240', 'weapon2': '0.396', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.800', 'FRAGCOUNT': '0.999', 'weapon5': '1.518', 'weapon3': '1.724'} +[2023-09-14 12:43:22,484][93871] DAMAGECOUNT value on done: 286.0 +[2023-09-14 12:43:22,484][93871] DAMAGECOUNT value on done: 91.0 +[2023-09-14 12:43:22,484][93871] Sum rewards: 2.942, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'weapon5': '0.268', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.740', 'weapon2': '1.276', 'weapon3': '2.190'} +[2023-09-14 12:43:22,906][93837] DAMAGECOUNT value on done: 250.0 +[2023-09-14 12:43:22,907][93837] Sum rewards: 4.995, reward structure: {'HEALTH': '-2.300', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.036', 'AMMO3': '0.076', 'weapon2': '0.150', 'AMMO4': '0.181', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon4': '0.562', 'WEAPON3': '0.600', 'weapon5': '0.692', 'FRAGCOUNT': '2.000', 'weapon3': '2.182', 'DAMAGECOUNT': '2.200'} +[2023-09-14 12:43:22,906][93837] DAMAGECOUNT value on done: 260.0 +[2023-09-14 12:43:22,907][93837] Sum rewards: 3.561, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO2': '0.026', 'weapon2': '0.042', 'AMMO3': '0.080', 'AMMO4': '0.128', 'weapon5': '0.238', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon4': '0.382', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.300', 'weapon3': '3.052'} +[2023-09-14 12:43:22,931][109198] Fps is (10 sec: 13118.1, 60 sec: 13380.3, 300 sec: 11923.9). Total num frames: 9924608. Throughput: 0: 2048.3, 1: 1312.1. Samples: 266175. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:43:22,933][109198] Avg episode reward: [(0, '3.846'), (1, '3.154')] +[2023-09-14 12:43:22,937][93674] Saving new best policy, reward=3.154! +[2023-09-14 12:43:23,097][93871] DAMAGECOUNT value on done: 155.0 +[2023-09-14 12:43:23,097][93871] DAMAGECOUNT value on done: 105.0 +[2023-09-14 12:43:23,098][93871] Sum rewards: 4.189, reward structure: {'HEALTH': '-1.450', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.260', 'weapon2': '0.354', 'WEAPON3': '0.400', 'FRAGCOUNT': '0.999', 'weapon5': '1.018', 'DAMAGECOUNT': '1.350', 'weapon3': '1.940'} +[2023-09-14 12:43:23,613][93838] DAMAGECOUNT value on done: 245.0 +[2023-09-14 12:43:23,613][93838] DAMAGECOUNT value on done: 199.0 +[2023-09-14 12:43:23,614][93838] Sum rewards: 2.988, reward structure: {'HEALTH': '-1.750', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.020', 'AMMO3': '0.030', 'AMMO4': '0.097', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon2': '0.290', 'WEAPON3': '0.300', 'weapon5': '0.390', 'weapon4': '0.556', 'FRAGCOUNT': '1.000', 'weapon3': '1.050', 'DAMAGECOUNT': '1.700'} +[2023-09-14 12:43:23,614][93838] Sum rewards: 2.649, reward structure: {'HEALTH': '-1.700', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.020', 'AMMO3': '0.038', 'AMMO4': '0.099', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.312', 'weapon4': '0.744', 'weapon3': '0.846', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.790'} +[2023-09-14 12:43:23,913][93874] DAMAGECOUNT value on done: 275.0 +[2023-09-14 12:43:23,913][93874] DAMAGECOUNT value on done: 275.0 +[2023-09-14 12:43:23,914][93874] Sum rewards: 2.247, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.027', 'AMMO2': '-0.005', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.004', 'AMMO3': '0.038', 'WEAPON5': '0.100', 'WEAPON3': '0.300', 'weapon2': '0.376', 'weapon3': '0.998', 'weapon5': '2.464'} +[2023-09-14 12:43:24,194][93838] DAMAGECOUNT value on done: 115.0 +[2023-09-14 12:43:24,195][93838] DAMAGECOUNT value on done: 200.0 +[2023-09-14 12:43:24,195][93838] Sum rewards: 5.739, reward structure: {'HEALTH': '-0.850', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.030', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon2': '0.100', 'AMMO4': '0.150', 'WEAPON3': '0.200', 'weapon3': '0.752', 'weapon4': '0.814', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150', 'weapon5': '2.168'} +[2023-09-14 12:43:24,229][93835] Updated weights for policy 0, policy_version 1609 (0.0013) +[2023-09-14 12:43:24,589][93874] DAMAGECOUNT value on done: 100.0 +[2023-09-14 12:43:24,590][93874] DAMAGECOUNT value on done: 135.0 +[2023-09-14 12:43:24,590][93874] Sum rewards: 4.595, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.035', 'weapon2': '0.038', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.210', 'WEAPON3': '0.300', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon3': '1.060', 'weapon5': '2.748'} +[2023-09-14 12:43:25,611][93987] DAMAGECOUNT value on done: 160.0 +[2023-09-14 12:43:25,611][93987] DAMAGECOUNT value on done: 40.0 +[2023-09-14 12:43:25,612][93987] Sum rewards: 3.080, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.014', 'AMMO3': '0.040', 'AMMO4': '0.071', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon2': '0.308', 'weapon4': '0.362', 'WEAPON3': '0.400', 'weapon5': '0.736', 'DAMAGECOUNT': '0.850', 'weapon3': '1.990'} +[2023-09-14 12:43:25,704][93836] Updated weights for policy 1, policy_version 822 (0.0012) +[2023-09-14 12:43:26,324][93987] DAMAGECOUNT value on done: 450.0 +[2023-09-14 12:43:26,324][93987] DAMAGECOUNT value on done: 355.0 +[2023-09-14 12:43:26,325][93987] Sum rewards: 5.753, reward structure: {'HEALTH': '-0.650', 'HITCOUNT': '0.000', 'AMMO3': '0.020', 'AMMO2': '0.025', 'WEAPON4': '0.100', 'AMMO4': '0.124', 'WEAPON3': '0.200', 'weapon2': '0.490', 'weapon4': '0.584', 'weapon3': '0.810', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050'} +[2023-09-14 12:43:26,452][93837] DAMAGECOUNT value on done: 305.0 +[2023-09-14 12:43:26,453][93837] DAMAGECOUNT value on done: 315.0 +[2023-09-14 12:43:26,453][93837] Sum rewards: 1.703, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO3': '0.066', 'WEAPON5': '0.300', 'weapon5': '0.498', 'WEAPON3': '0.600', 'weapon2': '0.722', 'DAMAGECOUNT': '0.850', 'weapon3': '2.714'} +[2023-09-14 12:43:26,454][93837] Sum rewards: 3.644, reward structure: {'HEALTH': '-0.850', 'HITCOUNT': '0.000', 'AMMO3': '0.020', 'AMMO2': '0.035', 'WEAPON4': '0.100', 'weapon2': '0.130', 'AMMO4': '0.175', 'WEAPON3': '0.200', 'weapon3': '0.782', 'weapon4': '0.902', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150'} +[2023-09-14 12:43:26,792][93987] DAMAGECOUNT value on done: 250.0 +[2023-09-14 12:43:26,792][93987] DAMAGECOUNT value on done: 445.0 +[2023-09-14 12:43:26,792][93987] Sum rewards: 0.280, reward structure: {'HEALTH': '-4.050', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.036', 'weapon2': '0.094', 'AMMO3': '0.118', 'AMMO4': '0.182', 'WEAPON4': '0.300', 'WEAPON5': '0.400', 'weapon4': '0.502', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon5': '1.074', 'DAMAGECOUNT': '1.650', 'weapon3': '2.154'} +[2023-09-14 12:43:26,793][93987] Sum rewards: 9.505, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.013', 'AMMO4': '0.022', 'AMMO3': '0.067', 'weapon2': '0.136', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.306', 'WEAPON3': '0.600', 'weapon5': '0.776', 'weapon3': '2.732', 'FRAGCOUNT': '3.999', 'DAMAGECOUNT': '4.350'} +[2023-09-14 12:43:27,077][93837] DAMAGECOUNT value on done: 335.0 +[2023-09-14 12:43:27,077][93837] DAMAGECOUNT value on done: 195.0 +[2023-09-14 12:43:27,078][93837] Sum rewards: 2.487, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.033', 'AMMO2': '-0.007', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.040', 'DAMAGECOUNT': '0.150', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.570', 'weapon5': '1.326', 'weapon3': '1.882'} +[2023-09-14 12:43:27,501][93987] DAMAGECOUNT value on done: 447.0 +[2023-09-14 12:43:27,502][93987] DAMAGECOUNT value on done: 325.0 +[2023-09-14 12:43:27,502][93987] Sum rewards: 4.031, reward structure: {'HEALTH': '-0.250', 'HITCOUNT': '0.000', 'AMMO3': '0.020', 'weapon2': '0.028', 'AMMO2': '0.030', 'WEAPON4': '0.100', 'AMMO4': '0.149', 'WEAPON3': '0.200', 'weapon3': '0.744', 'weapon4': '0.810', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.200'} +[2023-09-14 12:43:27,502][93987] Sum rewards: 0.964, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.053', 'AMMO2': '-0.010', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO3': '0.075', 'DAMAGECOUNT': '0.250', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon5': '0.652', 'weapon2': '0.972', 'weapon3': '2.164'} +[2023-09-14 12:43:27,931][109198] Fps is (10 sec: 13516.8, 60 sec: 13448.6, 300 sec: 12029.3). Total num frames: 9994240. Throughput: 0: 2023.1, 1: 1349.0. Samples: 275989. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:43:27,933][109198] Avg episode reward: [(0, '3.771'), (1, '3.227')] +[2023-09-14 12:43:27,934][93674] Saving new best policy, reward=3.227! +[2023-09-14 12:43:30,217][93835] Updated weights for policy 0, policy_version 1619 (0.0012) +[2023-09-14 12:43:31,387][93836] Updated weights for policy 1, policy_version 832 (0.0012) +[2023-09-14 12:43:32,931][109198] Fps is (10 sec: 13926.4, 60 sec: 13516.8, 300 sec: 12124.2). Total num frames: 10063872. Throughput: 0: 1975.6, 1: 1429.5. Samples: 296715. Policy #0 lag: (min: 0.0, avg: 0.7, max: 1.0) +[2023-09-14 12:43:32,933][109198] Avg episode reward: [(0, '3.771'), (1, '3.227')] +[2023-09-14 12:43:34,265][109198] Keyboard interrupt detected in the event loop EvtLoop [Runner_EvtLoop, process=main process 109198], exiting... +[2023-09-14 12:43:34,267][93585] Stopping Batcher_0... +[2023-09-14 12:43:34,267][93674] Stopping Batcher_1... +[2023-09-14 12:43:34,267][93674] Loop batcher_evt_loop terminating... +[2023-09-14 12:43:34,267][93585] Loop batcher_evt_loop terminating... +[2023-09-14 12:43:34,267][109198] Runner profile tree view: +main_loop: 108.8521 +[2023-09-14 12:43:34,268][93674] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000837_3428352.pth... +[2023-09-14 12:43:34,268][93585] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001625_6656000.pth... +[2023-09-14 12:43:34,268][109198] Collected {0: 6656000, 1: 3428352}, FPS: 11326.3 +[2023-09-14 12:43:34,287][93836] Weights refcount: 2 0 +[2023-09-14 12:43:34,289][93836] Stopping InferenceWorker_p1-w0... +[2023-09-14 12:43:34,289][93836] Loop inference_proc1-0_evt_loop terminating... +[2023-09-14 12:43:34,289][93835] Weights refcount: 2 0 +[2023-09-14 12:43:34,290][93835] Stopping InferenceWorker_p0-w0... +[2023-09-14 12:43:34,291][93835] Loop inference_proc0-0_evt_loop terminating... +[2023-09-14 12:43:34,328][93585] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001368_5603328.pth +[2023-09-14 12:43:34,331][93674] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000651_2666496.pth +[2023-09-14 12:43:34,336][93585] Stopping LearnerWorker_p0... +[2023-09-14 12:43:34,336][93585] Loop learner_proc0_evt_loop terminating... +[2023-09-14 12:43:34,338][93674] Stopping LearnerWorker_p1... +[2023-09-14 12:43:34,339][93674] Loop learner_proc1_evt_loop terminating... +[2023-09-14 12:43:35,070][93873] Stopping RolloutWorker_w4... +[2023-09-14 12:43:35,071][93873] Loop rollout_proc4_evt_loop terminating... +[2023-09-14 12:43:35,072][93906] Stopping RolloutWorker_w6... +[2023-09-14 12:43:35,073][93906] Loop rollout_proc6_evt_loop terminating... +[2023-09-14 12:43:35,073][93871] Stopping RolloutWorker_w3... +[2023-09-14 12:43:35,074][93871] Loop rollout_proc3_evt_loop terminating... +[2023-09-14 12:43:35,075][93837] Stopping RolloutWorker_w0... +[2023-09-14 12:43:35,076][93837] Loop rollout_proc0_evt_loop terminating... +[2023-09-14 12:43:35,077][93839] Stopping RolloutWorker_w2... +[2023-09-14 12:43:35,078][93839] Loop rollout_proc2_evt_loop terminating... +[2023-09-14 12:43:35,078][93874] Stopping RolloutWorker_w5... +[2023-09-14 12:43:35,079][93874] Loop rollout_proc5_evt_loop terminating... +[2023-09-14 12:43:35,095][93987] Stopping RolloutWorker_w7... +[2023-09-14 12:43:35,095][93987] Loop rollout_proc7_evt_loop terminating... +[2023-09-14 12:43:35,102][93838] Stopping RolloutWorker_w1... +[2023-09-14 12:43:35,103][93838] Loop rollout_proc1_evt_loop terminating... +[2023-09-14 12:43:49,514][109198] Environment doom_basic already registered, overwriting... +[2023-09-14 12:43:49,517][109198] Environment doom_two_colors_easy already registered, overwriting... +[2023-09-14 12:43:49,518][109198] Environment doom_two_colors_hard already registered, overwriting... +[2023-09-14 12:43:49,520][109198] Environment doom_dm already registered, overwriting... +[2023-09-14 12:43:49,521][109198] Environment doom_dwango5 already registered, overwriting... +[2023-09-14 12:43:49,522][109198] Environment doom_my_way_home_flat_actions already registered, overwriting... +[2023-09-14 12:43:49,523][109198] Environment doom_defend_the_center_flat_actions already registered, overwriting... +[2023-09-14 12:43:49,524][109198] Environment doom_my_way_home already registered, overwriting... +[2023-09-14 12:43:49,525][109198] Environment doom_deadly_corridor already registered, overwriting... +[2023-09-14 12:43:49,527][109198] Environment doom_defend_the_center already registered, overwriting... +[2023-09-14 12:43:49,528][109198] Environment doom_defend_the_line already registered, overwriting... +[2023-09-14 12:43:49,529][109198] Environment doom_health_gathering already registered, overwriting... +[2023-09-14 12:43:49,531][109198] Environment doom_health_gathering_supreme already registered, overwriting... +[2023-09-14 12:43:49,532][109198] Environment doom_battle already registered, overwriting... +[2023-09-14 12:43:49,533][109198] Environment doom_battle2 already registered, overwriting... +[2023-09-14 12:43:49,534][109198] Environment doom_duel_bots already registered, overwriting... +[2023-09-14 12:43:49,535][109198] Environment doom_deathmatch_bots already registered, overwriting... +[2023-09-14 12:43:49,536][109198] Environment doom_duel already registered, overwriting... +[2023-09-14 12:43:49,537][109198] Environment doom_deathmatch_full already registered, overwriting... +[2023-09-14 12:43:49,538][109198] Environment doom_benchmark already registered, overwriting... +[2023-09-14 12:43:49,539][109198] register_encoder_factory: +[2023-09-14 12:43:49,566][109198] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json +[2023-09-14 12:43:49,571][109198] Experiment dir /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment already exists! +[2023-09-14 12:43:49,572][109198] Resuming existing experiment from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment... +[2023-09-14 12:43:49,574][109198] Weights and Biases integration disabled +[2023-09-14 12:43:49,577][109198] Environment var CUDA_VISIBLE_DEVICES is 0,1 + +[2023-09-14 12:43:51,688][109198] Starting experiment with the following configuration: +help=False +algo=APPO +env=doom_duel +experiment=default_experiment +train_dir=/home/cogstack/Documents/optuna/environments/sample_factory/train_dir +restart_behavior=resume +device=gpu +seed=None +num_policies=2 +async_rl=True +serial_mode=False +batched_sampling=False +num_batches_to_accumulate=2 +worker_num_splits=2 +policy_workers_per_policy=1 +max_policy_lag=1000 +num_workers=8 +num_envs_per_worker=4 +batch_size=1024 +num_batches_per_epoch=1 +num_epochs=1 +rollout=32 +recurrence=32 +shuffle_minibatches=False +gamma=0.99 +reward_scale=1.0 +reward_clip=1000.0 +value_bootstrap=False +normalize_returns=True +exploration_loss_coeff=0.001 +value_loss_coeff=0.5 +kl_loss_coeff=0.0 +exploration_loss=symmetric_kl +gae_lambda=0.95 +ppo_clip_ratio=0.1 +ppo_clip_value=0.2 +with_vtrace=False +vtrace_rho=1.0 +vtrace_c=1.0 +optimizer=adam +adam_eps=1e-06 +adam_beta1=0.9 +adam_beta2=0.999 +max_grad_norm=4.0 +learning_rate=0.0001 +lr_schedule=constant +lr_schedule_kl_threshold=0.008 +lr_adaptive_min=1e-06 +lr_adaptive_max=0.01 +obs_subtract_mean=0.0 +obs_scale=255.0 +normalize_input=True +normalize_input_keys=None +decorrelate_experience_max_seconds=0 +decorrelate_envs_on_one_worker=True +actor_worker_gpus=[] +set_workers_cpu_affinity=True +force_envs_single_thread=False +default_niceness=0 +log_to_file=True +experiment_summaries_interval=10 +flush_summaries_interval=30 +stats_avg=100 +summaries_use_frameskip=True +heartbeat_interval=20 +heartbeat_reporting_interval=600 +train_for_env_steps=10000000 +train_for_seconds=10000000000 +save_every_sec=120 +keep_checkpoints=2 +load_checkpoint_kind=latest +save_milestones_sec=-1 +save_best_every_sec=5 +save_best_metric=reward +save_best_after=100000 +benchmark=False +encoder_mlp_layers=[512, 512] +encoder_conv_architecture=convnet_simple +encoder_conv_mlp_layers=[512] +use_rnn=True +rnn_size=512 +rnn_type=gru +rnn_num_layers=1 +decoder_mlp_layers=[] +nonlinearity=elu +policy_initialization=orthogonal +policy_init_gain=1.0 +actor_critic_share_weights=True +adaptive_stddev=True +continuous_tanh_scale=0.0 +initial_stddev=1.0 +use_env_info_cache=False +env_gpu_actions=False +env_gpu_observations=True +env_frameskip=4 +env_framestack=1 +pixel_format=CHW +use_record_episode_statistics=False +with_wandb=False +wandb_user=None +wandb_project=sample_factory +wandb_group=None +wandb_job_type=SF +wandb_tags=[] +with_pbt=False +pbt_mix_policies_in_one_env=True +pbt_period_env_steps=5000000 +pbt_start_mutation=20000000 +pbt_replace_fraction=0.3 +pbt_mutation_rate=0.15 +pbt_replace_reward_gap=0.1 +pbt_replace_reward_gap_absolute=1e-06 +pbt_optimize_gamma=False +pbt_target_objective=true_objective +pbt_perturb_min=1.1 +pbt_perturb_max=1.5 +num_agents=-1 +num_humans=0 +num_bots=-1 +start_bot_difficulty=None +timelimit=None +res_w=128 +res_h=72 +wide_aspect_ratio=False +eval_env_frameskip=1 +fps=35 +command_line=--env=doom_dm --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=20000000 +cli_args={'env': 'doom_dm', 'num_workers': 8, 'num_envs_per_worker': 4, 'train_for_env_steps': 20000000} +git_hash=20b6d44612dad7d171f23e13b1f3b4c5e5631cf9 +git_repo_name=https://github.com/MattStammers/optuna.git +[2023-09-14 12:43:51,690][109198] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json... +[2023-09-14 12:43:51,808][109198] Rollout worker 0 uses device cpu +[2023-09-14 12:43:51,810][109198] Rollout worker 1 uses device cpu +[2023-09-14 12:43:51,811][109198] Rollout worker 2 uses device cpu +[2023-09-14 12:43:51,812][109198] Rollout worker 3 uses device cpu +[2023-09-14 12:43:51,812][109198] Rollout worker 4 uses device cpu +[2023-09-14 12:43:51,814][109198] Rollout worker 5 uses device cpu +[2023-09-14 12:43:51,815][109198] Rollout worker 6 uses device cpu +[2023-09-14 12:43:51,816][109198] Rollout worker 7 uses device cpu +[2023-09-14 12:43:51,881][109198] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:43:51,882][109198] InferenceWorker_p0-w0: min num requests: 1 +[2023-09-14 12:43:51,886][109198] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:43:51,887][109198] InferenceWorker_p1-w0: min num requests: 1 +[2023-09-14 12:43:51,913][109198] Starting all processes... +[2023-09-14 12:43:51,914][109198] Starting process learner_proc0 +[2023-09-14 12:43:53,503][109198] Starting process learner_proc1 +[2023-09-14 12:43:53,505][101718] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:43:53,505][101718] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 +[2023-09-14 12:43:53,541][101718] Num visible devices: 1 +[2023-09-14 12:43:53,584][101718] Starting seed is not provided +[2023-09-14 12:43:53,584][101718] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:43:53,584][101718] Initializing actor-critic model on device cuda:0 +[2023-09-14 12:43:53,585][101718] RunningMeanStd input shape: (23,) +[2023-09-14 12:43:53,585][101718] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:43:53,586][101718] RunningMeanStd input shape: (1,) +[2023-09-14 12:43:53,597][101718] ConvEncoder: input_channels=3 +[2023-09-14 12:43:53,727][101718] Conv encoder output size: 512 +[2023-09-14 12:43:53,728][101718] Policy head output size: 640 +[2023-09-14 12:43:53,745][101718] Created Actor Critic model with architecture: +[2023-09-14 12:43:53,745][101718] ActorCriticSharedWeights( + (obs_normalizer): ObservationNormalizer( + (running_mean_std): RunningMeanStdDictInPlace( + (running_mean_std): ModuleDict( + (measurements): RunningMeanStdInPlace() + (obs): RunningMeanStdInPlace() + ) + ) + ) + (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) + (encoder): VizdoomEncoder( + (basic_encoder): ConvEncoder( + (enc): RecursiveScriptModule( + original_name=ConvEncoderImpl + (conv_head): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Conv2d) + (1): RecursiveScriptModule(original_name=ELU) + (2): RecursiveScriptModule(original_name=Conv2d) + (3): RecursiveScriptModule(original_name=ELU) + (4): RecursiveScriptModule(original_name=Conv2d) + (5): RecursiveScriptModule(original_name=ELU) + ) + (mlp_layers): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Linear) + (1): RecursiveScriptModule(original_name=ELU) + ) + ) + ) + (measurements_head): Sequential( + (0): Linear(in_features=23, out_features=128, bias=True) + (1): ELU(alpha=1.0) + (2): Linear(in_features=128, out_features=128, bias=True) + (3): ELU(alpha=1.0) + ) + ) + (core): ModelCoreRNN( + (core): GRU(640, 512) + ) + (decoder): MlpDecoder( + (mlp): Identity() + ) + (critic_linear): Linear(in_features=512, out_features=1, bias=True) + (action_parameterization): ActionParameterizationDefault( + (distribution_linear): Linear(in_features=512, out_features=41, bias=True) + ) +) +[2023-09-14 12:43:54,751][101718] Using optimizer +[2023-09-14 12:43:54,752][101718] Loading state from checkpoint /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001625_6656000.pth... +[2023-09-14 12:43:54,783][101718] Loading model from checkpoint +[2023-09-14 12:43:54,789][101718] Loaded experiment state at self.train_step=1625, self.env_steps=6656000 +[2023-09-14 12:43:54,789][101718] Initialized policy 0 weights for model version 1625 +[2023-09-14 12:43:54,791][101718] LearnerWorker_p0 finished initialization! +[2023-09-14 12:43:54,791][101718] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:43:55,180][101802] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:43:55,180][101802] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for learning process 1 +[2023-09-14 12:43:55,179][109198] Starting all processes... +[2023-09-14 12:43:55,184][109198] Starting process inference_proc0-0 +[2023-09-14 12:43:55,184][109198] Starting process inference_proc1-0 +[2023-09-14 12:43:55,198][101802] Num visible devices: 1 +[2023-09-14 12:43:55,185][109198] Starting process rollout_proc0 +[2023-09-14 12:43:55,187][109198] Starting process rollout_proc1 +[2023-09-14 12:43:55,188][109198] Starting process rollout_proc2 +[2023-09-14 12:43:55,227][101802] Starting seed is not provided +[2023-09-14 12:43:55,227][101802] Using GPUs [0] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:43:55,227][101802] Initializing actor-critic model on device cuda:0 +[2023-09-14 12:43:55,228][101802] RunningMeanStd input shape: (23,) +[2023-09-14 12:43:55,229][101802] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:43:55,229][101802] RunningMeanStd input shape: (1,) +[2023-09-14 12:43:55,243][101802] ConvEncoder: input_channels=3 +[2023-09-14 12:43:55,188][109198] Starting process rollout_proc3 +[2023-09-14 12:43:55,189][109198] Starting process rollout_proc4 +[2023-09-14 12:43:55,190][109198] Starting process rollout_proc5 +[2023-09-14 12:43:55,190][109198] Starting process rollout_proc6 +[2023-09-14 12:43:55,190][109198] Starting process rollout_proc7 +[2023-09-14 12:43:55,476][101802] Conv encoder output size: 512 +[2023-09-14 12:43:55,477][101802] Policy head output size: 640 +[2023-09-14 12:43:55,506][101802] Created Actor Critic model with architecture: +[2023-09-14 12:43:55,506][101802] ActorCriticSharedWeights( + (obs_normalizer): ObservationNormalizer( + (running_mean_std): RunningMeanStdDictInPlace( + (running_mean_std): ModuleDict( + (measurements): RunningMeanStdInPlace() + (obs): RunningMeanStdInPlace() + ) + ) + ) + (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) + (encoder): VizdoomEncoder( + (basic_encoder): ConvEncoder( + (enc): RecursiveScriptModule( + original_name=ConvEncoderImpl + (conv_head): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Conv2d) + (1): RecursiveScriptModule(original_name=ELU) + (2): RecursiveScriptModule(original_name=Conv2d) + (3): RecursiveScriptModule(original_name=ELU) + (4): RecursiveScriptModule(original_name=Conv2d) + (5): RecursiveScriptModule(original_name=ELU) + ) + (mlp_layers): RecursiveScriptModule( + original_name=Sequential + (0): RecursiveScriptModule(original_name=Linear) + (1): RecursiveScriptModule(original_name=ELU) + ) + ) + ) + (measurements_head): Sequential( + (0): Linear(in_features=23, out_features=128, bias=True) + (1): ELU(alpha=1.0) + (2): Linear(in_features=128, out_features=128, bias=True) + (3): ELU(alpha=1.0) + ) + ) + (core): ModelCoreRNN( + (core): GRU(640, 512) + ) + (decoder): MlpDecoder( + (mlp): Identity() + ) + (critic_linear): Linear(in_features=512, out_features=1, bias=True) + (action_parameterization): ActionParameterizationDefault( + (distribution_linear): Linear(in_features=512, out_features=41, bias=True) + ) +) +[2023-09-14 12:43:56,906][101802] Using optimizer +[2023-09-14 12:43:56,907][101802] Loading state from checkpoint /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000837_3428352.pth... +[2023-09-14 12:43:56,947][101802] Loading model from checkpoint +[2023-09-14 12:43:56,956][101802] Loaded experiment state at self.train_step=837, self.env_steps=3428352 +[2023-09-14 12:43:56,957][101802] Initialized policy 1 weights for model version 837 +[2023-09-14 12:43:56,959][101802] LearnerWorker_p1 finished initialization! +[2023-09-14 12:43:56,959][101802] Using GPUs [0] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:43:57,265][102003] Worker 1 uses CPU cores [4, 5, 6, 7] +[2023-09-14 12:43:57,455][102004] Worker 2 uses CPU cores [8, 9, 10, 11] +[2023-09-14 12:43:57,478][101964] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-09-14 12:43:57,478][101964] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for inference process 1 +[2023-09-14 12:43:57,481][101965] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 12:43:57,481][101965] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 +[2023-09-14 12:43:57,483][102005] Worker 3 uses CPU cores [12, 13, 14, 15] +[2023-09-14 12:43:57,499][101964] Num visible devices: 1 +[2023-09-14 12:43:57,499][101965] Num visible devices: 1 +[2023-09-14 12:43:57,600][102040] Worker 6 uses CPU cores [24, 25, 26, 27] +[2023-09-14 12:43:57,617][102046] Worker 7 uses CPU cores [28, 29, 30, 31] +[2023-09-14 12:43:57,644][102037] Worker 4 uses CPU cores [16, 17, 18, 19] +[2023-09-14 12:43:57,788][102039] Worker 5 uses CPU cores [20, 21, 22, 23] +[2023-09-14 12:43:57,823][102001] Worker 0 uses CPU cores [0, 1, 2, 3] +[2023-09-14 12:43:58,263][101965] RunningMeanStd input shape: (23,) +[2023-09-14 12:43:58,264][101965] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:43:58,264][101965] RunningMeanStd input shape: (1,) +[2023-09-14 12:43:58,282][101965] ConvEncoder: input_channels=3 +[2023-09-14 12:43:58,294][101964] RunningMeanStd input shape: (23,) +[2023-09-14 12:43:58,294][101964] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 12:43:58,294][101964] RunningMeanStd input shape: (1,) +[2023-09-14 12:43:58,306][101964] ConvEncoder: input_channels=3 +[2023-09-14 12:43:58,388][101965] Conv encoder output size: 512 +[2023-09-14 12:43:58,389][101965] Policy head output size: 640 +[2023-09-14 12:43:58,409][101964] Conv encoder output size: 512 +[2023-09-14 12:43:58,410][101964] Policy head output size: 640 +[2023-09-14 12:43:58,673][109198] Inference worker 0-0 is ready! +[2023-09-14 12:43:58,693][109198] Inference worker 1-0 is ready! +[2023-09-14 12:43:58,694][109198] All inference workers are ready! Signal rollout workers to start! +[2023-09-14 12:43:58,698][102040] Multi agent env, num agents: 2 +[2023-09-14 12:43:58,698][102046] Multi agent env, num agents: 2 +[2023-09-14 12:43:58,698][102003] Multi agent env, num agents: 2 +[2023-09-14 12:43:58,698][102037] Multi agent env, num agents: 2 +[2023-09-14 12:43:58,699][102039] Multi agent env, num agents: 2 +[2023-09-14 12:43:58,699][102005] Multi agent env, num agents: 2 +[2023-09-14 12:43:58,699][102001] Multi agent env, num agents: 2 +[2023-09-14 12:43:58,702][102004] Multi agent env, num agents: 2 +[2023-09-14 12:43:58,728][102040] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:43:58,729][102046] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:43:58,731][102040] Multi agent env, num agents: 2 +[2023-09-14 12:43:58,731][102001] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:43:58,731][102046] Multi agent env, num agents: 2 +[2023-09-14 12:43:58,731][102005] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:43:58,733][102004] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:43:58,734][102001] Multi agent env, num agents: 2 +[2023-09-14 12:43:58,735][102005] Multi agent env, num agents: 2 +[2023-09-14 12:43:58,737][102004] Multi agent env, num agents: 2 +[2023-09-14 12:43:58,745][102039] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:43:58,745][102003] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:43:58,746][102037] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 12:43:58,749][102039] Multi agent env, num agents: 2 +[2023-09-14 12:43:58,749][102003] Multi agent env, num agents: 2 +[2023-09-14 12:43:58,750][102037] Multi agent env, num agents: 2 +[2023-09-14 12:43:58,760][102046] UDP port 41000 cannot be used [Errno 98] Address already in use +[2023-09-14 12:43:58,761][102040] Port 40900 is available +[2023-09-14 12:43:58,761][102040] Using port 40900 +[2023-09-14 12:43:58,761][102046] Port 42000 is available +[2023-09-14 12:43:58,761][102046] Using port 42000 +[2023-09-14 12:43:58,762][102040] Initializing env for player 0, init_info: {'port': 40900}... +[2023-09-14 12:43:58,762][102046] Initializing env for player 0, init_info: {'port': 42000}... +[2023-09-14 12:43:58,763][102001] Port 40300 is available +[2023-09-14 12:43:58,763][102001] Using port 40300 +[2023-09-14 12:43:58,764][102001] Initializing env for player 0, init_info: {'port': 40300}... +[2023-09-14 12:43:58,764][102005] Port 40600 is available +[2023-09-14 12:43:58,765][102005] Using port 40600 +[2023-09-14 12:43:58,766][102005] Initializing env for player 0, init_info: {'port': 40600}... +[2023-09-14 12:43:58,766][102004] Port 40500 is available +[2023-09-14 12:43:58,766][102004] Using port 40500 +[2023-09-14 12:43:58,767][102004] Initializing env for player 0, init_info: {'port': 40500}... +[2023-09-14 12:43:58,790][102046] Using port 42000 on host... +[2023-09-14 12:43:58,794][102005] Using port 40600 on host... +[2023-09-14 12:43:58,795][102004] Using port 40500 on host... +[2023-09-14 12:43:58,795][102003] Port 40400 is available +[2023-09-14 12:43:58,795][102037] Port 40700 is available +[2023-09-14 12:43:58,795][102003] Using port 40400 +[2023-09-14 12:43:58,796][102037] Using port 40700 +[2023-09-14 12:43:58,797][102037] Initializing env for player 0, init_info: {'port': 40700}... +[2023-09-14 12:43:58,797][102040] Using port 40900 on host... +[2023-09-14 12:43:58,798][102001] Using port 40300 on host... +[2023-09-14 12:43:58,803][102039] Port 40800 is available +[2023-09-14 12:43:58,803][102039] Using port 40800 +[2023-09-14 12:43:58,812][102040] Initializing env for player 1, init_info: {'port': 40900}... +[2023-09-14 12:43:58,813][102046] Initializing env for player 1, init_info: {'port': 42000}... +[2023-09-14 12:43:58,815][102001] Initializing env for player 1, init_info: {'port': 40300}... +[2023-09-14 12:43:58,816][102005] Initializing env for player 1, init_info: {'port': 40600}... +[2023-09-14 12:43:58,818][102004] Initializing env for player 1, init_info: {'port': 40500}... +[2023-09-14 12:43:58,845][102037] Using port 40700 on host... +[2023-09-14 12:43:58,853][102037] Initializing env for player 1, init_info: {'port': 40700}... +[2023-09-14 12:43:59,578][109198] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 10084352. Throughput: 0: nan, 1: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 12:43:59,865][102001] Initialized w:0 v:0 player:1 +[2023-09-14 12:43:59,866][102001] Initialized w:0 v:0 player:0 +[2023-09-14 12:43:59,868][102001] 2 agent workers initialized for env 0! +[2023-09-14 12:43:59,880][102001] Decorrelating experience for 0 frames... +[2023-09-14 12:43:59,881][102001] Port 40301 is available +[2023-09-14 12:43:59,881][102001] Using port 40301 +[2023-09-14 12:43:59,881][102001] Initializing env for player 0, init_info: {'port': 40301}... +[2023-09-14 12:43:59,906][102003] Initializing env for player 0, init_info: {'port': 40400}... +[2023-09-14 12:43:59,911][102001] Using port 40301 on host... +[2023-09-14 12:43:59,932][102001] Initializing env for player 1, init_info: {'port': 40301}... +[2023-09-14 12:43:59,943][102004] Initialized w:2 v:0 player:1 +[2023-09-14 12:43:59,944][102004] Initialized w:2 v:0 player:0 +[2023-09-14 12:43:59,945][102004] 2 agent workers initialized for env 2! +[2023-09-14 12:43:59,947][102003] Using port 40400 on host... +[2023-09-14 12:43:59,952][102040] Initialized w:6 v:0 player:0 +[2023-09-14 12:43:59,952][102040] Initialized w:6 v:0 player:1 +[2023-09-14 12:43:59,954][102040] 2 agent workers initialized for env 6! +[2023-09-14 12:43:59,954][102046] Initialized w:7 v:0 player:0 +[2023-09-14 12:43:59,955][102004] Decorrelating experience for 0 frames... +[2023-09-14 12:43:59,955][102046] Initialized w:7 v:0 player:1 +[2023-09-14 12:43:59,956][102004] Port 40501 is available +[2023-09-14 12:43:59,956][102004] Using port 40501 +[2023-09-14 12:43:59,956][102004] Initializing env for player 0, init_info: {'port': 40501}... +[2023-09-14 12:43:59,956][102005] Initialized w:3 v:0 player:1 +[2023-09-14 12:43:59,957][102046] 2 agent workers initialized for env 7! +[2023-09-14 12:43:59,957][102005] Initialized w:3 v:0 player:0 +[2023-09-14 12:43:59,957][102003] Initializing env for player 1, init_info: {'port': 40400}... +[2023-09-14 12:43:59,958][102005] 2 agent workers initialized for env 3! +[2023-09-14 12:43:59,964][102040] Decorrelating experience for 0 frames... +[2023-09-14 12:43:59,964][102040] Port 40901 is available +[2023-09-14 12:43:59,965][102040] Using port 40901 +[2023-09-14 12:43:59,966][102039] Initializing env for player 0, init_info: {'port': 40800}... +[2023-09-14 12:43:59,973][102005] Decorrelating experience for 0 frames... +[2023-09-14 12:43:59,973][102005] Port 40601 is available +[2023-09-14 12:43:59,973][102005] Using port 40601 +[2023-09-14 12:43:59,974][102005] Initializing env for player 0, init_info: {'port': 40601}... +[2023-09-14 12:43:59,974][102046] Decorrelating experience for 0 frames... +[2023-09-14 12:43:59,975][102046] UDP port 41001 cannot be used [Errno 98] Address already in use +[2023-09-14 12:43:59,975][102046] Port 42001 is available +[2023-09-14 12:43:59,975][102046] Using port 42001 +[2023-09-14 12:43:59,976][102046] Initializing env for player 0, init_info: {'port': 42001}... +[2023-09-14 12:43:59,986][102004] Using port 40501 on host... +[2023-09-14 12:43:59,987][102037] Initialized w:4 v:0 player:1 +[2023-09-14 12:43:59,988][102037] Initialized w:4 v:0 player:0 +[2023-09-14 12:43:59,989][102037] 2 agent workers initialized for env 4! +[2023-09-14 12:43:59,999][102037] Decorrelating experience for 0 frames... +[2023-09-14 12:44:00,003][102005] Using port 40601 on host... +[2023-09-14 12:44:00,006][102046] Using port 42001 on host... +[2023-09-14 12:44:00,007][102037] Port 40701 is available +[2023-09-14 12:44:00,007][102037] Using port 40701 +[2023-09-14 12:44:00,007][102004] Initializing env for player 1, init_info: {'port': 40501}... +[2023-09-14 12:44:00,008][102037] Initializing env for player 0, init_info: {'port': 40701}... +[2023-09-14 12:44:00,013][102039] Using port 40800 on host... +[2023-09-14 12:44:00,020][102039] Initializing env for player 1, init_info: {'port': 40800}... +[2023-09-14 12:44:00,024][102005] Initializing env for player 1, init_info: {'port': 40601}... +[2023-09-14 12:44:00,026][102046] Initializing env for player 1, init_info: {'port': 42001}... +[2023-09-14 12:44:00,053][102037] Using port 40701 on host... +[2023-09-14 12:44:00,059][102037] Initializing env for player 1, init_info: {'port': 40701}... +[2023-09-14 12:44:01,027][102004] Initialized w:2 v:1 player:1 +[2023-09-14 12:44:01,028][102004] Initialized w:2 v:1 player:0 +[2023-09-14 12:44:01,030][102004] 2 agent workers initialized for env 2! +[2023-09-14 12:44:01,042][102004] Decorrelating experience for 32 frames... +[2023-09-14 12:44:01,059][102001] Initialized w:0 v:1 player:1 +[2023-09-14 12:44:01,060][102001] Initialized w:0 v:1 player:0 +[2023-09-14 12:44:01,062][102001] 2 agent workers initialized for env 0! +[2023-09-14 12:44:01,073][102001] Decorrelating experience for 32 frames... +[2023-09-14 12:44:01,076][102040] Initializing env for player 0, init_info: {'port': 40901}... +[2023-09-14 12:44:01,080][102046] Initialized w:7 v:1 player:1 +[2023-09-14 12:44:01,081][102046] Initialized w:7 v:1 player:0 +[2023-09-14 12:44:01,082][102046] 2 agent workers initialized for env 7! +[2023-09-14 12:44:01,098][102046] Decorrelating experience for 32 frames... +[2023-09-14 12:44:01,113][102040] Using port 40901 on host... +[2023-09-14 12:44:01,116][102004] Multi agent env, num agents: 2 +[2023-09-14 12:44:01,126][102040] Initializing env for player 1, init_info: {'port': 40901}... +[2023-09-14 12:44:01,129][102039] Initialized w:5 v:0 player:1 +[2023-09-14 12:44:01,131][102039] Initialized w:5 v:0 player:0 +[2023-09-14 12:44:01,132][102039] 2 agent workers initialized for env 5! +[2023-09-14 12:44:01,156][102003] Initialized w:1 v:0 player:1 +[2023-09-14 12:44:01,158][102003] Initialized w:1 v:0 player:0 +[2023-09-14 12:44:01,159][102003] 2 agent workers initialized for env 1! +[2023-09-14 12:44:01,161][102004] Multi agent env, num agents: 2 +[2023-09-14 12:44:01,164][102039] Decorrelating experience for 0 frames... +[2023-09-14 12:44:01,169][102003] Decorrelating experience for 0 frames... +[2023-09-14 12:44:01,169][102005] Initialized w:3 v:1 player:1 +[2023-09-14 12:44:01,169][102005] Initialized w:3 v:1 player:0 +[2023-09-14 12:44:01,169][102037] Initialized w:4 v:1 player:0 +[2023-09-14 12:44:01,170][102037] Initialized w:4 v:1 player:1 +[2023-09-14 12:44:01,170][102005] 2 agent workers initialized for env 3! +[2023-09-14 12:44:01,171][102037] 2 agent workers initialized for env 4! +[2023-09-14 12:44:01,176][102001] Multi agent env, num agents: 2 +[2023-09-14 12:44:01,180][102037] Decorrelating experience for 32 frames... +[2023-09-14 12:44:01,188][102005] Decorrelating experience for 32 frames... +[2023-09-14 12:44:01,197][102046] Multi agent env, num agents: 2 +[2023-09-14 12:44:01,214][102001] Multi agent env, num agents: 2 +[2023-09-14 12:44:01,215][102039] Port 40801 is available +[2023-09-14 12:44:01,215][102003] Port 40401 is available +[2023-09-14 12:44:01,216][102039] Using port 40801 +[2023-09-14 12:44:01,216][102003] Using port 40401 +[2023-09-14 12:44:01,215][102004] Port 40502 is available +[2023-09-14 12:44:01,216][102004] Using port 40502 +[2023-09-14 12:44:01,216][102039] Initializing env for player 0, init_info: {'port': 40801}... +[2023-09-14 12:44:01,216][102003] Initializing env for player 0, init_info: {'port': 40401}... +[2023-09-14 12:44:01,216][102004] Initializing env for player 0, init_info: {'port': 40502}... +[2023-09-14 12:44:01,237][102046] Multi agent env, num agents: 2 +[2023-09-14 12:44:01,251][102004] Using port 40502 on host... +[2023-09-14 12:44:01,251][102001] Port 40302 is available +[2023-09-14 12:44:01,252][102001] Using port 40302 +[2023-09-14 12:44:01,257][102037] Multi agent env, num agents: 2 +[2023-09-14 12:44:01,266][102039] Initializing env for player 1, init_info: {'port': 40801}... +[2023-09-14 12:44:01,267][102003] Initializing env for player 1, init_info: {'port': 40401}... +[2023-09-14 12:44:01,267][102004] Initializing env for player 1, init_info: {'port': 40502}... +[2023-09-14 12:44:01,271][102039] Using port 40801 on host... +[2023-09-14 12:44:01,273][102046] UDP port 41002 cannot be used [Errno 98] Address already in use +[2023-09-14 12:44:01,274][102003] Using port 40401 on host... +[2023-09-14 12:44:01,274][102046] Port 42002 is available +[2023-09-14 12:44:01,274][102046] Using port 42002 +[2023-09-14 12:44:01,274][102046] Initializing env for player 0, init_info: {'port': 42002}... +[2023-09-14 12:44:01,278][102005] Multi agent env, num agents: 2 +[2023-09-14 12:44:01,289][102037] Multi agent env, num agents: 2 +[2023-09-14 12:44:01,303][102046] Using port 42002 on host... +[2023-09-14 12:44:01,318][102037] Port 40702 is available +[2023-09-14 12:44:01,318][102037] Using port 40702 +[2023-09-14 12:44:01,319][102037] Initializing env for player 0, init_info: {'port': 40702}... +[2023-09-14 12:44:01,325][102005] Multi agent env, num agents: 2 +[2023-09-14 12:44:01,325][102046] Initializing env for player 1, init_info: {'port': 42002}... +[2023-09-14 12:44:01,348][102037] Using port 40702 on host... +[2023-09-14 12:44:01,369][102037] Initializing env for player 1, init_info: {'port': 40702}... +[2023-09-14 12:44:01,371][102005] Port 40602 is available +[2023-09-14 12:44:01,371][102005] Using port 40602 +[2023-09-14 12:44:01,371][102005] Initializing env for player 0, init_info: {'port': 40602}... +[2023-09-14 12:44:01,405][102005] Using port 40602 on host... +[2023-09-14 12:44:01,422][102005] Initializing env for player 1, init_info: {'port': 40602}... +[2023-09-14 12:44:02,306][102040] Initialized w:6 v:1 player:0 +[2023-09-14 12:44:02,307][102040] Initialized w:6 v:1 player:1 +[2023-09-14 12:44:02,309][102040] 2 agent workers initialized for env 6! +[2023-09-14 12:44:02,312][102001] Initializing env for player 0, init_info: {'port': 40302}... +[2023-09-14 12:44:02,323][102040] Decorrelating experience for 32 frames... +[2023-09-14 12:44:02,346][102001] Using port 40302 on host... +[2023-09-14 12:44:02,363][102001] Initializing env for player 1, init_info: {'port': 40302}... +[2023-09-14 12:44:02,374][102003] Initialized w:1 v:1 player:1 +[2023-09-14 12:44:02,375][102003] Initialized w:1 v:1 player:0 +[2023-09-14 12:44:02,377][102003] 2 agent workers initialized for env 1! +[2023-09-14 12:44:02,387][102003] Decorrelating experience for 32 frames... +[2023-09-14 12:44:02,392][102037] Initialized w:4 v:2 player:0 +[2023-09-14 12:44:02,393][102037] Initialized w:4 v:2 player:1 +[2023-09-14 12:44:02,394][102037] 2 agent workers initialized for env 4! +[2023-09-14 12:44:02,394][102004] Initialized w:2 v:2 player:1 +[2023-09-14 12:44:02,394][102004] Initialized w:2 v:2 player:0 +[2023-09-14 12:44:02,396][102004] 2 agent workers initialized for env 2! +[2023-09-14 12:44:02,396][102040] Multi agent env, num agents: 2 +[2023-09-14 12:44:02,403][102004] Decorrelating experience for 64 frames... +[2023-09-14 12:44:02,404][102037] Decorrelating experience for 64 frames... +[2023-09-14 12:44:02,432][102040] Multi agent env, num agents: 2 +[2023-09-14 12:44:02,463][102003] Multi agent env, num agents: 2 +[2023-09-14 12:44:02,468][102040] Port 40902 is available +[2023-09-14 12:44:02,468][102040] Using port 40902 +[2023-09-14 12:44:02,469][102040] Initializing env for player 0, init_info: {'port': 40902}... +[2023-09-14 12:44:02,490][102046] Initialized w:7 v:2 player:0 +[2023-09-14 12:44:02,491][102046] Initialized w:7 v:2 player:1 +[2023-09-14 12:44:02,492][102046] 2 agent workers initialized for env 7! +[2023-09-14 12:44:02,502][102046] Decorrelating experience for 64 frames... +[2023-09-14 12:44:02,505][102040] Using port 40902 on host... +[2023-09-14 12:44:02,509][102003] Multi agent env, num agents: 2 +[2023-09-14 12:44:02,519][102040] Initializing env for player 1, init_info: {'port': 40902}... +[2023-09-14 12:44:02,530][102005] Initialized w:3 v:2 player:1 +[2023-09-14 12:44:02,531][102005] Initialized w:3 v:2 player:0 +[2023-09-14 12:44:02,532][102005] 2 agent workers initialized for env 3! +[2023-09-14 12:44:02,537][102004] Port 40503 is available +[2023-09-14 12:44:02,537][102004] Using port 40503 +[2023-09-14 12:44:02,537][102004] Initializing env for player 0, init_info: {'port': 40503}... +[2023-09-14 12:44:02,542][102005] Decorrelating experience for 64 frames... +[2023-09-14 12:44:02,554][102003] Port 40402 is available +[2023-09-14 12:44:02,554][102003] Using port 40402 +[2023-09-14 12:44:02,555][102037] Port 40703 is available +[2023-09-14 12:44:02,555][102003] Initializing env for player 0, init_info: {'port': 40402}... +[2023-09-14 12:44:02,555][102037] Using port 40703 +[2023-09-14 12:44:02,555][102037] Initializing env for player 0, init_info: {'port': 40703}... +[2023-09-14 12:44:02,567][102004] Using port 40503 on host... +[2023-09-14 12:44:02,581][102039] Initialized w:5 v:1 player:1 +[2023-09-14 12:44:02,581][102039] Initialized w:5 v:1 player:0 +[2023-09-14 12:44:02,582][102039] 2 agent workers initialized for env 5! +[2023-09-14 12:44:02,585][102037] Using port 40703 on host... +[2023-09-14 12:44:02,588][102004] Initializing env for player 1, init_info: {'port': 40503}... +[2023-09-14 12:44:02,592][102039] Decorrelating experience for 32 frames... +[2023-09-14 12:44:02,600][102003] Using port 40402 on host... +[2023-09-14 12:44:02,606][102037] Initializing env for player 1, init_info: {'port': 40703}... +[2023-09-14 12:44:02,607][102003] Initializing env for player 1, init_info: {'port': 40402}... +[2023-09-14 12:44:02,648][102046] Port 41003 is available +[2023-09-14 12:44:02,649][102046] Using port 41003 +[2023-09-14 12:44:02,649][102046] Initializing env for player 0, init_info: {'port': 41003}... +[2023-09-14 12:44:02,679][102039] Multi agent env, num agents: 2 +[2023-09-14 12:44:02,684][102046] Using port 41003 on host... +[2023-09-14 12:44:02,700][102046] Initializing env for player 1, init_info: {'port': 41003}... +[2023-09-14 12:44:02,700][102005] Port 40603 is available +[2023-09-14 12:44:02,701][102005] Using port 40603 +[2023-09-14 12:44:02,724][102039] Multi agent env, num agents: 2 +[2023-09-14 12:44:02,770][102039] Port 40802 is available +[2023-09-14 12:44:02,770][102039] Using port 40802 +[2023-09-14 12:44:02,770][102039] Initializing env for player 0, init_info: {'port': 40802}... +[2023-09-14 12:44:02,803][102039] Using port 40802 on host... +[2023-09-14 12:44:02,821][102039] Initializing env for player 1, init_info: {'port': 40802}... +[2023-09-14 12:44:03,405][102001] Initialized w:0 v:2 player:1 +[2023-09-14 12:44:03,406][102001] Initialized w:0 v:2 player:0 +[2023-09-14 12:44:03,408][102001] 2 agent workers initialized for env 0! +[2023-09-14 12:44:03,424][102001] Decorrelating experience for 64 frames... +[2023-09-14 12:44:03,542][102001] Port 40303 is available +[2023-09-14 12:44:03,542][102001] Using port 40303 +[2023-09-14 12:44:03,543][102001] Initializing env for player 0, init_info: {'port': 40303}... +[2023-09-14 12:44:03,569][102040] Initialized w:6 v:2 player:1 +[2023-09-14 12:44:03,571][102040] Initialized w:6 v:2 player:0 +[2023-09-14 12:44:03,571][102001] Using port 40303 on host... +[2023-09-14 12:44:03,572][102040] 2 agent workers initialized for env 6! +[2023-09-14 12:44:03,581][102040] Decorrelating experience for 64 frames... +[2023-09-14 12:44:03,593][102001] Initializing env for player 1, init_info: {'port': 40303}... +[2023-09-14 12:44:03,630][102004] Initialized w:2 v:3 player:0 +[2023-09-14 12:44:03,632][102004] Initialized w:2 v:3 player:1 +[2023-09-14 12:44:03,632][102004] 2 agent workers initialized for env 2! +[2023-09-14 12:44:03,641][102004] Decorrelating experience for 96 frames... +[2023-09-14 12:44:03,720][102046] Initialized w:7 v:3 player:1 +[2023-09-14 12:44:03,721][102046] Initialized w:7 v:3 player:0 +[2023-09-14 12:44:03,722][102046] 2 agent workers initialized for env 7! +[2023-09-14 12:44:03,727][102040] Port 40903 is available +[2023-09-14 12:44:03,728][102040] Using port 40903 +[2023-09-14 12:44:03,728][102040] Initializing env for player 0, init_info: {'port': 40903}... +[2023-09-14 12:44:03,730][102046] Decorrelating experience for 96 frames... +[2023-09-14 12:44:03,740][102037] Initialized w:4 v:3 player:0 +[2023-09-14 12:44:03,742][102037] Initialized w:4 v:3 player:1 +[2023-09-14 12:44:03,743][102037] 2 agent workers initialized for env 4! +[2023-09-14 12:44:03,745][102003] Initialized w:1 v:2 player:0 +[2023-09-14 12:44:03,745][102003] Initialized w:1 v:2 player:1 +[2023-09-14 12:44:03,746][102003] 2 agent workers initialized for env 1! +[2023-09-14 12:44:03,752][102037] Decorrelating experience for 96 frames... +[2023-09-14 12:44:03,756][102003] Decorrelating experience for 64 frames... +[2023-09-14 12:44:03,760][102005] Initializing env for player 0, init_info: {'port': 40603}... +[2023-09-14 12:44:03,763][102040] Using port 40903 on host... +[2023-09-14 12:44:03,779][102040] Initializing env for player 1, init_info: {'port': 40903}... +[2023-09-14 12:44:03,796][102005] Using port 40603 on host... +[2023-09-14 12:44:03,810][102005] Initializing env for player 1, init_info: {'port': 40603}... +[2023-09-14 12:44:03,855][102039] Initialized w:5 v:2 player:0 +[2023-09-14 12:44:03,856][102039] Initialized w:5 v:2 player:1 +[2023-09-14 12:44:03,857][102039] 2 agent workers initialized for env 5! +[2023-09-14 12:44:03,867][102039] Decorrelating experience for 64 frames... +[2023-09-14 12:44:03,910][102003] Port 40403 is available +[2023-09-14 12:44:03,910][102003] Using port 40403 +[2023-09-14 12:44:03,910][102003] Initializing env for player 0, init_info: {'port': 40403}... +[2023-09-14 12:44:03,946][102003] Using port 40403 on host... +[2023-09-14 12:44:03,961][102003] Initializing env for player 1, init_info: {'port': 40403}... +[2023-09-14 12:44:04,036][102039] Port 40803 is available +[2023-09-14 12:44:04,036][102039] Using port 40803 +[2023-09-14 12:44:04,037][102039] Initializing env for player 0, init_info: {'port': 40803}... +[2023-09-14 12:44:04,082][102039] Using port 40803 on host... +[2023-09-14 12:44:04,088][102039] Initializing env for player 1, init_info: {'port': 40803}... +[2023-09-14 12:44:04,577][109198] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 10084352. Throughput: 0: 0.0, 1: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) +[2023-09-14 12:44:04,658][102001] Initialized w:0 v:3 player:1 +[2023-09-14 12:44:04,668][102001] Initialized w:0 v:3 player:0 +[2023-09-14 12:44:04,669][102001] 2 agent workers initialized for env 0! +[2023-09-14 12:44:04,679][102001] Decorrelating experience for 96 frames... +[2023-09-14 12:44:04,805][102040] Initialized w:6 v:3 player:0 +[2023-09-14 12:44:04,805][102040] Initialized w:6 v:3 player:1 +[2023-09-14 12:44:04,807][102040] 2 agent workers initialized for env 6! +[2023-09-14 12:44:04,816][102040] Decorrelating experience for 96 frames... +[2023-09-14 12:44:04,880][102005] Initialized w:3 v:3 player:0 +[2023-09-14 12:44:04,880][102005] Initialized w:3 v:3 player:1 +[2023-09-14 12:44:04,882][102005] 2 agent workers initialized for env 3! +[2023-09-14 12:44:04,892][102005] Decorrelating experience for 96 frames... +[2023-09-14 12:44:05,112][102003] Initialized w:1 v:3 player:1 +[2023-09-14 12:44:05,112][102003] Initialized w:1 v:3 player:0 +[2023-09-14 12:44:05,114][102003] 2 agent workers initialized for env 1! +[2023-09-14 12:44:05,124][102003] Decorrelating experience for 96 frames... +[2023-09-14 12:44:05,187][102039] Initialized w:5 v:3 player:0 +[2023-09-14 12:44:05,188][102039] Initialized w:5 v:3 player:1 +[2023-09-14 12:44:05,189][102039] 2 agent workers initialized for env 5! +[2023-09-14 12:44:05,199][102039] Decorrelating experience for 96 frames... +[2023-09-14 12:44:06,379][101718] Signal inference workers to stop experience collection... +[2023-09-14 12:44:06,387][101965] InferenceWorker_p0-w0: stopping experience collection +[2023-09-14 12:44:06,398][101964] InferenceWorker_p1-w0: stopping experience collection +[2023-09-14 12:44:09,372][101718] Signal inference workers to resume experience collection... +[2023-09-14 12:44:09,373][101964] InferenceWorker_p1-w0: resuming experience collection +[2023-09-14 12:44:09,373][101965] InferenceWorker_p0-w0: resuming experience collection +[2023-09-14 12:44:09,578][109198] Fps is (10 sec: 819.2, 60 sec: 819.2, 300 sec: 819.2). Total num frames: 10092544. Throughput: 0: 257.0, 1: 216.0. Samples: 4730. Policy #0 lag: (min: 0.0, avg: 0.0, max: 0.0) +[2023-09-14 12:44:10,863][101802] Signal inference workers to stop experience collection... +[2023-09-14 12:44:11,525][101802] Signal inference workers to resume experience collection... +[2023-09-14 12:44:11,871][109198] Heartbeat connected on Batcher_0 +[2023-09-14 12:44:11,874][109198] Heartbeat connected on Batcher_1 +[2023-09-14 12:44:11,893][109198] Heartbeat connected on InferenceWorker_p1-w0 +[2023-09-14 12:44:11,895][109198] Heartbeat connected on RolloutWorker_w1 +[2023-09-14 12:44:11,898][109198] Heartbeat connected on RolloutWorker_w2 +[2023-09-14 12:44:11,899][109198] Heartbeat connected on RolloutWorker_w0 +[2023-09-14 12:44:11,900][109198] Heartbeat connected on RolloutWorker_w3 +[2023-09-14 12:44:11,906][109198] Heartbeat connected on RolloutWorker_w5 +[2023-09-14 12:44:11,909][109198] Heartbeat connected on RolloutWorker_w6 +[2023-09-14 12:44:11,912][109198] Heartbeat connected on RolloutWorker_w7 +[2023-09-14 12:44:11,913][109198] Heartbeat connected on RolloutWorker_w4 +[2023-09-14 12:44:11,942][109198] Heartbeat connected on LearnerWorker_p0 +[2023-09-14 12:44:11,950][109198] Heartbeat connected on InferenceWorker_p0-w0 +[2023-09-14 12:44:11,989][109198] Heartbeat connected on LearnerWorker_p1 +[2023-09-14 12:44:14,577][109198] Fps is (10 sec: 6553.6, 60 sec: 4369.1, 300 sec: 4369.1). Total num frames: 10149888. Throughput: 0: 548.7, 1: 450.3. Samples: 14984. Policy #0 lag: (min: 0.0, avg: 0.7, max: 3.0) +[2023-09-14 12:44:15,036][101965] Updated weights for policy 0, policy_version 1635 (0.0700) +[2023-09-14 12:44:16,264][101964] Updated weights for policy 1, policy_version 847 (0.0013) +[2023-09-14 12:44:19,577][109198] Fps is (10 sec: 12288.2, 60 sec: 6553.6, 300 sec: 6553.6). Total num frames: 10215424. Throughput: 0: 710.2, 1: 568.4. Samples: 25571. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:44:20,126][101965] Updated weights for policy 0, policy_version 1645 (0.0012) +[2023-09-14 12:44:22,804][101964] Updated weights for policy 1, policy_version 857 (0.0012) +[2023-09-14 12:44:24,577][109198] Fps is (10 sec: 13926.3, 60 sec: 8192.1, 300 sec: 8192.1). Total num frames: 10289152. Throughput: 0: 1052.6, 1: 832.5. Samples: 47129. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:44:25,131][101965] Updated weights for policy 0, policy_version 1655 (0.0013) +[2023-09-14 12:44:29,147][101964] Updated weights for policy 1, policy_version 867 (0.0011) +[2023-09-14 12:44:29,577][109198] Fps is (10 sec: 14745.7, 60 sec: 9284.3, 300 sec: 9284.3). Total num frames: 10362880. Throughput: 0: 1288.0, 1: 1013.3. Samples: 69038. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:44:30,197][101965] Updated weights for policy 0, policy_version 1665 (0.0013) +[2023-09-14 12:44:34,577][109198] Fps is (10 sec: 15155.3, 60 sec: 10181.6, 300 sec: 10181.6). Total num frames: 10440704. Throughput: 0: 1278.6, 1: 1004.8. Samples: 79918. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:44:35,158][101965] Updated weights for policy 0, policy_version 1675 (0.0012) +[2023-09-14 12:44:35,721][101964] Updated weights for policy 1, policy_version 877 (0.0014) +[2023-09-14 12:44:39,577][109198] Fps is (10 sec: 14745.6, 60 sec: 10649.6, 300 sec: 10649.6). Total num frames: 10510336. Throughput: 0: 1427.3, 1: 1117.5. Samples: 101792. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:44:39,933][102037] DAMAGECOUNT value on done: 130.0 +[2023-09-14 12:44:39,933][102037] DAMAGECOUNT value on done: 183.0 +[2023-09-14 12:44:39,934][102037] Sum rewards: 3.787, reward structure: {'HEALTH': '-1.780', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.052', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon2': '0.278', 'WEAPON3': '0.400', 'weapon4': '0.532', 'FRAGCOUNT': '1.000', 'weapon3': '1.244', 'DAMAGECOUNT': '1.300', 'weapon5': '1.406'} +[2023-09-14 12:44:39,934][102037] Sum rewards: 3.610, reward structure: {'HEALTH': '-1.250', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.025', 'AMMO3': '0.030', 'AMMO4': '0.125', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.406', 'weapon4': '0.870', 'FRAGCOUNT': '1.000', 'weapon3': '1.074', 'DAMAGECOUNT': '1.830'} +[2023-09-14 12:44:40,104][101965] Updated weights for policy 0, policy_version 1685 (0.0013) +[2023-09-14 12:44:40,164][102037] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:44:40,499][102037] DAMAGECOUNT value on done: 155.0 +[2023-09-14 12:44:40,500][102037] DAMAGECOUNT value on done: 220.0 +[2023-09-14 12:44:40,500][102037] Sum rewards: 0.889, reward structure: {'HEALTH': '-2.150', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.011', 'weapon2': '0.034', 'AMMO3': '0.050', 'AMMO4': '0.055', 'WEAPON4': '0.300', 'WEAPON3': '0.400', 'weapon4': '0.608', 'FRAGCOUNT': '1.000', 'weapon3': '1.030', 'DAMAGECOUNT': '1.550'} +[2023-09-14 12:44:40,501][102037] Sum rewards: 5.706, reward structure: {'HEALTH': '-1.500', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.017', 'AMMO3': '0.042', 'AMMO4': '0.086', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon2': '0.216', 'WEAPON3': '0.400', 'weapon4': '0.630', 'weapon5': '0.994', 'weapon3': '1.316', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.200'} +[2023-09-14 12:44:42,368][101964] Updated weights for policy 1, policy_version 887 (0.0013) +[2023-09-14 12:44:42,446][102005] DAMAGECOUNT value on done: 20.0 +[2023-09-14 12:44:42,446][102005] DAMAGECOUNT value on done: 40.0 +[2023-09-14 12:44:42,638][102005] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:44:43,005][102005] DAMAGECOUNT value on done: 175.0 +[2023-09-14 12:44:43,006][102005] DAMAGECOUNT value on done: 215.0 +[2023-09-14 12:44:43,006][102005] Sum rewards: 4.381, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.017', 'AMMO3': '0.066', 'AMMO4': '0.084', 'weapon2': '0.132', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'weapon5': '0.510', 'weapon4': '0.916', 'DAMAGECOUNT': '1.750', 'weapon3': '1.896', 'FRAGCOUNT': '2.000'} +[2023-09-14 12:44:43,006][102005] Sum rewards: 5.122, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO2': '0.037', 'AMMO3': '0.070', 'weapon2': '0.096', 'weapon5': '0.102', 'AMMO4': '0.185', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon4': '0.344', 'WEAPON3': '0.600', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.150', 'weapon3': '2.924'} +[2023-09-14 12:44:44,125][102046] DAMAGECOUNT value on done: 205.0 +[2023-09-14 12:44:44,126][102046] DAMAGECOUNT value on done: 100.0 +[2023-09-14 12:44:44,126][102046] Sum rewards: 6.918, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.013', 'AMMO3': '0.049', 'AMMO4': '0.065', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.278', 'weapon2': '0.356', 'WEAPON3': '0.400', 'weapon3': '1.532', 'weapon5': '1.764', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050'} +[2023-09-14 12:44:44,127][102046] Sum rewards: 2.750, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.012', 'AMMO3': '0.057', 'AMMO4': '0.061', 'WEAPON4': '0.100', 'weapon4': '0.126', 'WEAPON5': '0.200', 'weapon2': '0.390', 'WEAPON3': '0.500', 'weapon5': '0.676', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '2.618'} +[2023-09-14 12:44:44,207][102037] DAMAGECOUNT value on done: 105.0 +[2023-09-14 12:44:44,207][102037] DAMAGECOUNT value on done: 55.0 +[2023-09-14 12:44:44,208][102037] Sum rewards: 4.976, reward structure: {'HEALTH': '-0.550', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.025', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.124', 'WEAPON3': '0.200', 'weapon2': '0.448', 'weapon3': '0.614', 'weapon4': '0.628', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon5': '1.212'} +[2023-09-14 12:44:44,323][102046] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:44:44,577][109198] Fps is (10 sec: 14335.9, 60 sec: 11104.8, 300 sec: 11104.8). Total num frames: 10584064. Throughput: 0: 1552.6, 1: 1195.6. Samples: 123671. Policy #0 lag: (min: 0.0, avg: 0.9, max: 2.0) +[2023-09-14 12:44:44,579][109198] Avg episode reward: [(0, '4.096'), (1, '3.648')] +[2023-09-14 12:44:44,581][101802] Saving new best policy, reward=3.648! +[2023-09-14 12:44:44,726][102046] DAMAGECOUNT value on done: 360.0 +[2023-09-14 12:44:44,726][102046] DAMAGECOUNT value on done: 145.0 +[2023-09-14 12:44:44,727][102046] Sum rewards: 9.184, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.054', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.422', 'weapon3': '1.454', 'weapon5': '2.074', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.600'} +[2023-09-14 12:44:44,822][102037] DAMAGECOUNT value on done: 159.0 +[2023-09-14 12:44:44,823][102037] DAMAGECOUNT value on done: 260.0 +[2023-09-14 12:44:44,823][102037] Sum rewards: 2.188, reward structure: {'HEALTH': '-2.900', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.030', 'AMMO2': '-0.006', 'HITCOUNT': '0.000', 'AMMO5': '0.012', 'AMMO3': '0.073', 'WEAPON5': '0.300', 'weapon5': '0.436', 'weapon2': '0.482', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.590', 'weapon3': '2.630'} +[2023-09-14 12:44:44,824][102037] Sum rewards: 7.084, reward structure: {'HEALTH': '-1.300', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.015', 'AMMO3': '0.039', 'weapon2': '0.042', 'AMMO4': '0.074', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.726', 'weapon5': '0.776', 'FRAGCOUNT': '2.000', 'weapon3': '2.302', 'DAMAGECOUNT': '2.600'} +[2023-09-14 12:44:44,952][102004] DAMAGECOUNT value on done: 130.0 +[2023-09-14 12:44:44,952][102004] DAMAGECOUNT value on done: 100.0 +[2023-09-14 12:44:44,953][102004] Sum rewards: 4.683, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.003', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.430', 'weapon5': '0.718', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.300', 'weapon3': '2.288'} +[2023-09-14 12:44:44,953][102004] Sum rewards: 2.744, reward structure: {'HEALTH': '-1.300', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.010', 'AMMO3': '0.030', 'AMMO4': '0.049', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon2': '0.276', 'weapon5': '0.286', 'WEAPON3': '0.300', 'weapon4': '0.594', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.196'} +[2023-09-14 12:44:44,987][101965] Updated weights for policy 0, policy_version 1695 (0.0013) +[2023-09-14 12:44:45,320][102039] DAMAGECOUNT value on done: 305.0 +[2023-09-14 12:44:45,320][102039] DAMAGECOUNT value on done: 105.0 +[2023-09-14 12:44:45,321][102039] Sum rewards: 8.637, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.003', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.047', 'WEAPON4': '0.100', 'weapon2': '0.142', 'WEAPON5': '0.200', 'weapon4': '0.212', 'WEAPON3': '0.400', 'weapon3': '1.640', 'weapon5': '1.888', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.050'} +[2023-09-14 12:44:45,321][102039] Sum rewards: 1.199, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.042', 'AMMO3': '0.102', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'AMMO4': '0.210', 'weapon2': '0.322', 'weapon5': '0.528', 'weapon4': '0.592', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '2.242'} +[2023-09-14 12:44:45,557][102039] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:44:45,623][102004] DAMAGECOUNT value on done: 110.0 +[2023-09-14 12:44:45,624][102004] Sum rewards: 4.572, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.049', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.412', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon5': '1.722', 'weapon3': '1.810'} +[2023-09-14 12:44:45,624][102004] DAMAGECOUNT value on done: 110.0 +[2023-09-14 12:44:45,625][102004] Sum rewards: 3.075, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.015', 'AMMO3': '0.072', 'AMMO4': '0.073', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.356', 'WEAPON3': '0.600', 'weapon4': '0.632', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.100', 'weapon5': '1.392', 'weapon3': '1.428'} +[2023-09-14 12:44:45,959][102039] DAMAGECOUNT value on done: 205.0 +[2023-09-14 12:44:45,959][102039] DAMAGECOUNT value on done: 525.0 +[2023-09-14 12:44:45,960][102039] Sum rewards: -0.292, reward structure: {'DEATHCOUNT': '-5.000', 'HEALTH': '-5.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.027', 'weapon5': '0.072', 'AMMO4': '0.133', 'AMMO3': '0.167', 'weapon2': '0.352', 'WEAPON4': '0.400', 'WEAPON5': '0.400', 'weapon4': '0.502', 'WEAPON3': '1.100', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050', 'weapon3': '2.484'} +[2023-09-14 12:44:45,960][102039] Sum rewards: 11.234, reward structure: {'HEALTH': '-2.050', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.021', 'AMMO3': '0.066', 'AMMO4': '0.105', 'WEAPON4': '0.200', 'weapon5': '0.292', 'WEAPON5': '0.300', 'weapon4': '0.390', 'weapon2': '0.402', 'WEAPON3': '0.600', 'weapon3': '2.642', 'FRAGCOUNT': '5.000', 'DAMAGECOUNT': '5.250'} +[2023-09-14 12:44:45,982][102046] DAMAGECOUNT value on done: 105.0 +[2023-09-14 12:44:45,982][102046] DAMAGECOUNT value on done: 125.0 +[2023-09-14 12:44:45,982][102046] Sum rewards: 4.257, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.029', 'AMMO2': '-0.006', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.048', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.494', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon5': '1.484', 'weapon3': '1.806'} +[2023-09-14 12:44:45,983][102046] Sum rewards: 4.807, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.033', 'AMMO3': '0.040', 'AMMO4': '0.164', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.278', 'WEAPON3': '0.400', 'weapon4': '0.928', 'weapon5': '0.946', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.250', 'weapon3': '1.358'} +[2023-09-14 12:44:46,125][102040] DAMAGECOUNT value on done: 335.0 +[2023-09-14 12:44:46,125][102040] DAMAGECOUNT value on done: 220.0 +[2023-09-14 12:44:46,126][102040] Sum rewards: 7.040, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.010', 'AMMO4': '0.022', 'AMMO3': '0.057', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.256', 'weapon2': '0.422', 'WEAPON3': '0.500', 'weapon5': '0.752', 'weapon3': '2.266', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.350'} +[2023-09-14 12:44:46,126][102040] Sum rewards: 3.470, reward structure: {'HEALTH': '-3.250', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'weapon5': '0.034', 'AMMO2': '0.040', 'AMMO3': '0.101', 'weapon2': '0.170', 'AMMO4': '0.199', 'weapon4': '0.278', 'WEAPON4': '0.300', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.200', 'weapon3': '3.178'} +[2023-09-14 12:44:46,173][102004] DAMAGECOUNT value on done: 175.0 +[2023-09-14 12:44:46,173][102004] DAMAGECOUNT value on done: 277.0 +[2023-09-14 12:44:46,173][102004] Sum rewards: 2.841, reward structure: {'HEALTH': '-2.500', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.010', 'AMMO4': '0.021', 'AMMO3': '0.057', 'WEAPON5': '0.200', 'WEAPON3': '0.500', 'weapon2': '0.596', 'weapon5': '0.752', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.750', 'weapon3': '2.450'} +[2023-09-14 12:44:46,174][102004] Sum rewards: 3.282, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.022', 'AMMO3': '0.080', 'AMMO4': '0.107', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon5': '0.338', 'weapon4': '0.562', 'WEAPON3': '0.600', 'weapon2': '0.898', 'weapon3': '1.398', 'FRAGCOUNT': '1.998', 'DAMAGECOUNT': '2.770'} +[2023-09-14 12:44:46,382][102040] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:44:46,424][102004] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:44:46,445][102005] DAMAGECOUNT value on done: 110.0 +[2023-09-14 12:44:46,445][102005] DAMAGECOUNT value on done: 109.0 +[2023-09-14 12:44:46,446][102005] Sum rewards: 2.548, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO4': '0.025', 'AMMO3': '0.030', 'WEAPON4': '0.100', 'WEAPON3': '0.300', 'weapon4': '0.314', 'weapon2': '0.714', 'weapon3': '0.960', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100'} +[2023-09-14 12:44:46,446][102005] Sum rewards: 3.036, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.028', 'AMMO3': '0.035', 'WEAPON5': '0.100', 'AMMO4': '0.138', 'weapon2': '0.162', 'WEAPON4': '0.200', 'weapon5': '0.254', 'WEAPON3': '0.300', 'weapon4': '0.868', 'weapon3': '0.958', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.090'} +[2023-09-14 12:44:46,608][102046] DAMAGECOUNT value on done: 228.0 +[2023-09-14 12:44:46,608][102046] DAMAGECOUNT value on done: 390.0 +[2023-09-14 12:44:46,608][102046] Sum rewards: 1.106, reward structure: {'DEATHCOUNT': '-4.000', 'HEALTH': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.011', 'AMMO4': '0.054', 'AMMO3': '0.098', 'WEAPON5': '0.100', 'weapon2': '0.252', 'WEAPON4': '0.300', 'weapon5': '0.372', 'weapon4': '0.748', 'WEAPON3': '0.800', 'FRAGCOUNT': '2.000', 'weapon3': '2.088', 'DAMAGECOUNT': '2.280'} +[2023-09-14 12:44:46,609][102046] Sum rewards: 7.669, reward structure: {'HEALTH': '-2.180', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.024', 'AMMO3': '0.050', 'AMMO4': '0.119', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'weapon2': '0.520', 'weapon4': '0.800', 'weapon3': '1.636', 'DAMAGECOUNT': '3.900', 'FRAGCOUNT': '4.000'} +[2023-09-14 12:44:46,703][102003] DAMAGECOUNT value on done: 120.0 +[2023-09-14 12:44:46,703][102003] DAMAGECOUNT value on done: 140.0 +[2023-09-14 12:44:46,704][102003] Sum rewards: 3.942, reward structure: {'HEALTH': '-1.450', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.020', 'AMMO3': '0.040', 'weapon2': '0.090', 'AMMO4': '0.099', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.800', 'FRAGCOUNT': '0.999', 'weapon5': '1.112', 'DAMAGECOUNT': '1.200', 'weapon3': '1.224'} +[2023-09-14 12:44:46,732][102040] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:44:46,733][102040] DAMAGECOUNT value on done: 15.0 +[2023-09-14 12:44:46,811][102004] DAMAGECOUNT value on done: 200.0 +[2023-09-14 12:44:46,811][102004] DAMAGECOUNT value on done: 110.0 +[2023-09-14 12:44:46,812][102004] Sum rewards: 3.610, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.025', 'AMMO3': '0.050', 'AMMO4': '0.125', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon5': '0.354', 'weapon2': '0.416', 'WEAPON3': '0.500', 'FRAGCOUNT': '0.999', 'weapon4': '1.000', 'weapon3': '1.632', 'DAMAGECOUNT': '2.000'} +[2023-09-14 12:44:46,812][102004] Sum rewards: 2.956, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.032', 'AMMO2': '-0.006', 'HITCOUNT': '0.000', 'AMMO5': '0.012', 'AMMO3': '0.071', 'WEAPON5': '0.300', 'weapon2': '0.504', 'WEAPON3': '0.600', 'weapon5': '0.744', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.100', 'weapon3': '2.664'} +[2023-09-14 12:44:46,919][102003] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:44:47,025][102005] DAMAGECOUNT value on done: 85.0 +[2023-09-14 12:44:47,025][102005] DAMAGECOUNT value on done: 100.0 +[2023-09-14 12:44:47,026][102005] Sum rewards: 5.465, reward structure: {'HEALTH': '-0.850', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.790', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.120', 'weapon5': '2.080'} +[2023-09-14 12:44:47,193][102040] DAMAGECOUNT value on done: 40.0 +[2023-09-14 12:44:47,193][102040] DAMAGECOUNT value on done: 170.0 +[2023-09-14 12:44:47,194][102040] Sum rewards: 5.953, reward structure: {'HEALTH': '-0.400', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'AMMO2': '0.020', 'AMMO4': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon2': '0.120', 'WEAPON3': '0.200', 'weapon4': '0.582', 'weapon3': '0.716', 'FRAGCOUNT': '1.000', 'weapon5': '1.692', 'DAMAGECOUNT': '1.700'} +[2023-09-14 12:44:47,200][102039] DAMAGECOUNT value on done: 310.0 +[2023-09-14 12:44:47,200][102039] DAMAGECOUNT value on done: 130.0 +[2023-09-14 12:44:47,201][102039] Sum rewards: 8.154, reward structure: {'HEALTH': '-1.300', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.010', 'AMMO3': '0.041', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.730', 'weapon5': '0.932', 'weapon3': '2.036', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.100'} +[2023-09-14 12:44:47,201][102039] Sum rewards: 0.429, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.013', 'AMMO4': '0.064', 'AMMO3': '0.081', 'WEAPON5': '0.100', 'weapon2': '0.174', 'weapon5': '0.260', 'WEAPON4': '0.400', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon4': '1.000', 'DAMAGECOUNT': '1.300', 'weapon3': '1.432'} +[2023-09-14 12:44:47,276][102003] DAMAGECOUNT value on done: 5.0 +[2023-09-14 12:44:47,277][102003] DAMAGECOUNT value on done: 55.0 +[2023-09-14 12:44:47,449][102001] DAMAGECOUNT value on done: 40.0 +[2023-09-14 12:44:47,450][102001] DAMAGECOUNT value on done: 0.0 +[2023-09-14 12:44:47,651][102001] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 12:44:47,758][102040] DAMAGECOUNT value on done: 170.0 +[2023-09-14 12:44:47,759][102040] DAMAGECOUNT value on done: 100.0 +[2023-09-14 12:44:47,759][102040] Sum rewards: 4.638, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.025', 'AMMO3': '0.043', 'WEAPON5': '0.100', 'AMMO4': '0.122', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.410', 'weapon2': '0.430', 'FRAGCOUNT': '1.000', 'weapon5': '1.000', 'weapon3': '1.204', 'DAMAGECOUNT': '1.700'} +[2023-09-14 12:44:47,760][102040] Sum rewards: 3.423, reward structure: {'HEALTH': '-1.400', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.015', 'AMMO3': '0.040', 'AMMO4': '0.075', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon2': '0.258', 'WEAPON3': '0.400', 'weapon4': '0.664', 'weapon5': '0.710', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.356'} +[2023-09-14 12:44:47,912][102039] DAMAGECOUNT value on done: 100.0 +[2023-09-14 12:44:47,912][102039] DAMAGECOUNT value on done: 81.0 +[2023-09-14 12:44:47,913][102039] Sum rewards: 4.087, reward structure: {'HEALTH': '-1.310', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.039', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.236', 'WEAPON3': '0.400', 'weapon5': '0.594', 'weapon2': '0.662', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon3': '2.158'} +[2023-09-14 12:44:47,928][102003] DAMAGECOUNT value on done: 310.0 +[2023-09-14 12:44:47,928][102003] DAMAGECOUNT value on done: 200.0 +[2023-09-14 12:44:47,928][102003] Sum rewards: 7.609, reward structure: {'HEALTH': '-1.950', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.003', 'AMMO5': '0.010', 'AMMO4': '0.016', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.240', 'WEAPON3': '0.400', 'weapon5': '0.490', 'weapon2': '0.594', 'weapon3': '2.366', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.100'} +[2023-09-14 12:44:47,929][102003] Sum rewards: 1.927, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.019', 'AMMO3': '0.094', 'AMMO4': '0.096', 'WEAPON4': '0.200', 'weapon5': '0.224', 'WEAPON5': '0.300', 'weapon2': '0.318', 'weapon4': '0.458', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '2.000', 'weapon3': '2.502'} +[2023-09-14 12:44:48,053][102001] DAMAGECOUNT value on done: 135.0 +[2023-09-14 12:44:48,054][102001] DAMAGECOUNT value on done: 140.0 +[2023-09-14 12:44:48,054][102001] Sum rewards: 4.559, reward structure: {'HEALTH': '-1.350', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.025', 'AMMO3': '0.030', 'AMMO4': '0.124', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.442', 'weapon4': '0.790', 'FRAGCOUNT': '1.000', 'weapon3': '1.060', 'weapon5': '1.328', 'DAMAGECOUNT': '1.400'} +[2023-09-14 12:44:48,055][102001] Sum rewards: 2.590, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.011', 'AMMO4': '0.052', 'AMMO3': '0.066', 'WEAPON5': '0.200', 'weapon5': '0.296', 'WEAPON4': '0.300', 'weapon4': '0.492', 'weapon2': '0.570', 'WEAPON3': '0.600', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.350', 'weapon3': '1.644'} +[2023-09-14 12:44:48,474][101964] Updated weights for policy 1, policy_version 897 (0.0012) +[2023-09-14 12:44:48,608][102003] DAMAGECOUNT value on done: 120.0 +[2023-09-14 12:44:48,608][102003] DAMAGECOUNT value on done: 40.0 +[2023-09-14 12:44:48,609][102003] Sum rewards: 2.027, reward structure: {'HEALTH': '-1.850', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.013', 'AMMO3': '0.040', 'AMMO4': '0.064', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.400', 'weapon2': '0.610', 'weapon5': '1.292', 'weapon3': '1.850'} +[2023-09-14 12:44:48,752][102001] DAMAGECOUNT value on done: 94.0 +[2023-09-14 12:44:48,752][102001] DAMAGECOUNT value on done: 56.0 +[2023-09-14 12:44:49,396][102001] DAMAGECOUNT value on done: 165.0 +[2023-09-14 12:44:49,397][102001] DAMAGECOUNT value on done: 150.0 +[2023-09-14 12:44:49,397][102001] Sum rewards: 4.745, reward structure: {'HEALTH': '-1.400', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.050', 'weapon2': '0.090', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.242', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon5': '1.614', 'DAMAGECOUNT': '1.650', 'weapon3': '1.788'} +[2023-09-14 12:44:49,398][102001] Sum rewards: 4.462, reward structure: {'HEALTH': '-1.600', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.003', 'AMMO5': '0.010', 'AMMO4': '0.013', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'weapon4': '0.102', 'WEAPON5': '0.200', 'weapon2': '0.388', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon5': '1.294', 'DAMAGECOUNT': '1.500', 'weapon3': '2.012'} +[2023-09-14 12:44:49,577][109198] Fps is (10 sec: 14336.0, 60 sec: 11386.9, 300 sec: 11386.9). Total num frames: 10653696. Throughput: 0: 1671.0, 1: 1302.5. Samples: 133807. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:44:49,579][109198] Avg episode reward: [(0, '4.165'), (1, '3.407')] +[2023-09-14 12:44:50,467][101965] Updated weights for policy 0, policy_version 1705 (0.0013) +[2023-09-14 12:44:53,879][101964] Updated weights for policy 1, policy_version 907 (0.0014) +[2023-09-14 12:44:54,577][109198] Fps is (10 sec: 14336.0, 60 sec: 11692.3, 300 sec: 11692.3). Total num frames: 10727424. Throughput: 0: 1847.1, 1: 1497.8. Samples: 155247. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:44:54,579][109198] Avg episode reward: [(0, '4.165'), (1, '3.407')] +[2023-09-14 12:44:56,387][101965] Updated weights for policy 0, policy_version 1715 (0.0012) +[2023-09-14 12:44:59,186][101964] Updated weights for policy 1, policy_version 917 (0.0012) +[2023-09-14 12:44:59,577][109198] Fps is (10 sec: 14336.0, 60 sec: 11878.4, 300 sec: 11878.4). Total num frames: 10797056. Throughput: 0: 1944.7, 1: 1647.1. Samples: 176615. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:44:59,579][109198] Avg episode reward: [(0, '4.165'), (1, '3.407')] +[2023-09-14 12:45:02,898][101965] Updated weights for policy 0, policy_version 1725 (0.0013) +[2023-09-14 12:45:04,577][109198] Fps is (10 sec: 13926.4, 60 sec: 13038.9, 300 sec: 12036.0). Total num frames: 10866688. Throughput: 0: 1914.2, 1: 1659.6. Samples: 186393. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:45:04,579][109198] Avg episode reward: [(0, '4.165'), (1, '3.407')] +[2023-09-14 12:45:05,004][101964] Updated weights for policy 1, policy_version 927 (0.0014) +[2023-09-14 12:45:09,190][101965] Updated weights for policy 0, policy_version 1735 (0.0013) +[2023-09-14 12:45:09,577][109198] Fps is (10 sec: 13926.4, 60 sec: 14063.0, 300 sec: 12171.0). Total num frames: 10936320. Throughput: 0: 1868.3, 1: 1702.3. Samples: 207809. Policy #0 lag: (min: 0.0, avg: 0.7, max: 1.0) +[2023-09-14 12:45:09,579][109198] Avg episode reward: [(0, '4.165'), (1, '3.407')] +[2023-09-14 12:45:10,338][101964] Updated weights for policy 1, policy_version 937 (0.0011) +[2023-09-14 12:45:14,577][109198] Fps is (10 sec: 13926.3, 60 sec: 14267.7, 300 sec: 12288.0). Total num frames: 11005952. Throughput: 0: 1815.6, 1: 1739.8. Samples: 229032. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:45:14,579][109198] Avg episode reward: [(0, '4.165'), (1, '3.407')] +[2023-09-14 12:45:15,335][101965] Updated weights for policy 0, policy_version 1745 (0.0015) +[2023-09-14 12:45:15,918][101964] Updated weights for policy 1, policy_version 947 (0.0013) +[2023-09-14 12:45:17,617][102037] DAMAGECOUNT value on done: 305.0 +[2023-09-14 12:45:17,618][102037] DAMAGECOUNT value on done: 452.0 +[2023-09-14 12:45:17,618][102037] Sum rewards: 2.961, reward structure: {'HEALTH': '-2.690', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.014', 'AMMO2': '-0.003', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO3': '0.068', 'WEAPON5': '0.300', 'weapon5': '0.304', 'WEAPON3': '0.600', 'weapon2': '0.972', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.750', 'weapon3': '2.658'} +[2023-09-14 12:45:17,619][102037] Sum rewards: 4.574, reward structure: {'HEALTH': '-2.650', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.038', 'AMMO2': '-0.008', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.052', 'WEAPON5': '0.200', 'WEAPON3': '0.500', 'weapon2': '0.642', 'weapon5': '0.790', 'FRAGCOUNT': '1.999', 'weapon3': '2.386', 'DAMAGECOUNT': '2.690'} +[2023-09-14 12:45:18,225][102037] DAMAGECOUNT value on done: 260.0 +[2023-09-14 12:45:18,226][102037] DAMAGECOUNT value on done: 345.0 +[2023-09-14 12:45:18,226][102037] Sum rewards: 4.551, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.030', 'AMMO3': '0.046', 'weapon2': '0.070', 'WEAPON5': '0.100', 'AMMO4': '0.150', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.808', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '1.216', 'weapon5': '1.676'} +[2023-09-14 12:45:18,227][102037] Sum rewards: 4.750, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.009', 'AMMO3': '0.030', 'AMMO4': '0.044', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.276', 'WEAPON3': '0.300', 'weapon2': '0.642', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.250', 'weapon3': '1.464', 'weapon5': '1.530'} +[2023-09-14 12:45:18,339][102037] DAMAGECOUNT value on done: 265.0 +[2023-09-14 12:45:18,339][102037] DAMAGECOUNT value on done: 345.0 +[2023-09-14 12:45:18,340][102037] Sum rewards: 4.788, reward structure: {'HEALTH': '-2.350', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.008', 'AMMO5': '0.015', 'AMMO4': '0.041', 'weapon4': '0.052', 'AMMO3': '0.073', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon5': '0.696', 'weapon2': '0.738', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.100', 'weapon3': '2.414'} +[2023-09-14 12:45:18,340][102037] Sum rewards: 3.584, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO2': '0.015', 'weapon2': '0.036', 'AMMO4': '0.075', 'AMMO3': '0.079', 'WEAPON4': '0.200', 'weapon5': '0.222', 'WEAPON5': '0.300', 'weapon4': '0.322', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.400', 'weapon3': '3.222'} +[2023-09-14 12:45:18,876][102037] DAMAGECOUNT value on done: 470.0 +[2023-09-14 12:45:18,876][102037] DAMAGECOUNT value on done: 339.0 +[2023-09-14 12:45:18,877][102037] Sum rewards: 5.988, reward structure: {'HEALTH': '-1.800', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO5': '0.010', 'AMMO4': '0.011', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'weapon2': '0.194', 'WEAPON5': '0.200', 'weapon4': '0.322', 'WEAPON3': '0.400', 'weapon5': '1.484', 'weapon3': '1.924', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.100'} +[2023-09-14 12:45:18,877][102037] Sum rewards: 3.714, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO3': '0.071', 'WEAPON4': '0.100', 'weapon2': '0.218', 'weapon4': '0.228', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon5': '1.062', 'DAMAGECOUNT': '1.800', 'weapon3': '2.332'} +[2023-09-14 12:45:19,577][109198] Fps is (10 sec: 13926.5, 60 sec: 14336.0, 300 sec: 12390.4). Total num frames: 11075584. Throughput: 0: 1787.3, 1: 1757.4. Samples: 239433. Policy #0 lag: (min: 0.0, avg: 0.4, max: 2.0) +[2023-09-14 12:45:19,579][109198] Avg episode reward: [(0, '4.193'), (1, '3.446')] +[2023-09-14 12:45:19,969][102005] DAMAGECOUNT value on done: 185.0 +[2023-09-14 12:45:19,969][102005] DAMAGECOUNT value on done: 265.0 +[2023-09-14 12:45:19,969][102005] Sum rewards: 3.273, reward structure: {'HEALTH': '-2.250', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.015', 'AMMO4': '0.024', 'AMMO3': '0.059', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon2': '0.380', 'weapon4': '0.596', 'WEAPON3': '0.600', 'weapon5': '0.840', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.650', 'weapon3': '1.754'} +[2023-09-14 12:45:19,970][102005] Sum rewards: 4.163, reward structure: {'HEALTH': '-2.550', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.012', 'AMMO2': '0.020', 'AMMO3': '0.057', 'weapon2': '0.092', 'AMMO4': '0.100', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'WEAPON3': '0.500', 'weapon4': '0.790', 'weapon5': '0.940', 'weapon3': '1.452', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.250'} +[2023-09-14 12:45:20,513][102040] DAMAGECOUNT value on done: 425.0 +[2023-09-14 12:45:20,513][102040] DAMAGECOUNT value on done: 225.0 +[2023-09-14 12:45:20,514][102040] Sum rewards: 3.203, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.015', 'AMMO3': '0.030', 'AMMO4': '0.075', 'WEAPON5': '0.100', 'weapon2': '0.102', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon4': '0.694', 'DAMAGECOUNT': '0.900', 'weapon3': '0.996', 'weapon5': '1.788'} +[2023-09-14 12:45:20,514][102040] Sum rewards: 1.745, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.020', 'AMMO3': '0.030', 'DAMAGECOUNT': '0.050', 'AMMO4': '0.098', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.400', 'weapon4': '0.494', 'weapon3': '1.022', 'weapon5': '1.028'} +[2023-09-14 12:45:20,516][102005] DAMAGECOUNT value on done: 385.0 +[2023-09-14 12:45:20,517][102005] DAMAGECOUNT value on done: 620.0 +[2023-09-14 12:45:20,517][102005] Sum rewards: 0.506, reward structure: {'HEALTH': '-4.000', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO2': '0.029', 'AMMO3': '0.099', 'weapon5': '0.112', 'AMMO4': '0.144', 'weapon4': '0.162', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon2': '0.558', 'WEAPON3': '0.800', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '2.100', 'weapon3': '2.988'} +[2023-09-14 12:45:20,518][102005] Sum rewards: 6.915, reward structure: {'HEALTH': '-2.100', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.015', 'AMMO3': '0.069', 'AMMO4': '0.074', 'WEAPON5': '0.100', 'weapon5': '0.212', 'weapon2': '0.238', 'WEAPON4': '0.300', 'WEAPON3': '0.600', 'weapon4': '0.868', 'weapon3': '1.486', 'FRAGCOUNT': '2.999', 'DAMAGECOUNT': '4.050'} +[2023-09-14 12:45:21,118][101964] Updated weights for policy 1, policy_version 957 (0.0013) +[2023-09-14 12:45:21,229][102040] DAMAGECOUNT value on done: 158.0 +[2023-09-14 12:45:21,230][102040] DAMAGECOUNT value on done: 357.0 +[2023-09-14 12:45:21,230][102040] Sum rewards: 0.938, reward structure: {'HEALTH': '-3.150', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO4': '0.049', 'AMMO3': '0.063', 'WEAPON5': '0.100', 'weapon2': '0.168', 'WEAPON4': '0.400', 'weapon5': '0.410', 'WEAPON3': '0.600', 'weapon4': '0.994', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.430', 'weapon3': '1.858'} +[2023-09-14 12:45:21,231][102040] Sum rewards: 7.995, reward structure: {'HEALTH': '-1.380', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.030', 'AMMO3': '0.050', 'AMMO4': '0.149', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.220', 'WEAPON3': '0.400', 'weapon4': '0.772', 'weapon3': '0.856', 'weapon5': '0.920', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.570'} +[2023-09-14 12:45:21,552][101965] Updated weights for policy 0, policy_version 1755 (0.0013) +[2023-09-14 12:45:23,120][102004] DAMAGECOUNT value on done: 260.0 +[2023-09-14 12:45:23,121][102004] DAMAGECOUNT value on done: 179.0 +[2023-09-14 12:45:23,121][102004] Sum rewards: 5.842, reward structure: {'HEALTH': '-0.790', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.019', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.772', 'FRAGCOUNT': '1.000', 'weapon3': '1.094', 'DAMAGECOUNT': '1.300', 'weapon5': '2.142'} +[2023-09-14 12:45:23,122][102004] Sum rewards: 1.737, reward structure: {'HEALTH': '-2.100', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.016', 'AMMO4': '0.077', 'AMMO3': '0.078', 'weapon2': '0.106', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.600', 'weapon4': '0.686', 'DAMAGECOUNT': '0.790', 'weapon3': '1.262', 'weapon5': '1.814'} +[2023-09-14 12:45:23,669][102046] DAMAGECOUNT value on done: 305.0 +[2023-09-14 12:45:23,670][102046] DAMAGECOUNT value on done: 220.0 +[2023-09-14 12:45:23,670][102046] Sum rewards: 3.903, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'weapon2': '0.002', 'AMMO5': '0.010', 'AMMO2': '0.028', 'AMMO3': '0.042', 'AMMO4': '0.139', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.836', 'weapon4': '0.842', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.354'} +[2023-09-14 12:45:23,670][102046] Sum rewards: 5.073, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.010', 'AMMO3': '0.049', 'AMMO4': '0.050', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.300', 'weapon2': '0.368', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.200', 'weapon3': '1.578', 'weapon5': '1.808'} +[2023-09-14 12:45:23,672][102004] DAMAGECOUNT value on done: 210.0 +[2023-09-14 12:45:23,673][102004] DAMAGECOUNT value on done: 410.0 +[2023-09-14 12:45:23,674][102004] Sum rewards: 8.771, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.012', 'AMMO3': '0.047', 'AMMO4': '0.061', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.428', 'weapon5': '1.672', 'weapon3': '1.842', 'FRAGCOUNT': '2.999', 'DAMAGECOUNT': '3.000'} +[2023-09-14 12:45:23,964][102005] DAMAGECOUNT value on done: 314.0 +[2023-09-14 12:45:23,964][102005] DAMAGECOUNT value on done: 310.0 +[2023-09-14 12:45:23,964][102005] Sum rewards: 4.814, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.020', 'AMMO3': '0.065', 'weapon2': '0.090', 'AMMO4': '0.097', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon4': '0.468', 'WEAPON3': '0.500', 'weapon5': '1.504', 'weapon3': '1.714', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050'} +[2023-09-14 12:45:23,965][102005] Sum rewards: 4.964, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.022', 'weapon2': '0.036', 'AMMO3': '0.075', 'AMMO4': '0.111', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon5': '0.674', 'weapon4': '0.680', 'DAMAGECOUNT': '2.000', 'FRAGCOUNT': '2.000', 'weapon3': '2.250'} +[2023-09-14 12:45:24,147][102004] DAMAGECOUNT value on done: 412.0 +[2023-09-14 12:45:24,148][102004] DAMAGECOUNT value on done: 266.0 +[2023-09-14 12:45:24,148][102004] Sum rewards: 4.775, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'FRAGCOUNT': '0.999', 'weapon5': '1.052', 'weapon2': '1.106', 'DAMAGECOUNT': '1.350', 'weapon3': '1.650'} +[2023-09-14 12:45:24,148][102004] Sum rewards: 1.189, reward structure: {'HEALTH': '-2.100', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'weapon2': '0.002', 'AMMO5': '0.007', 'AMMO2': '0.020', 'AMMO3': '0.052', 'AMMO4': '0.100', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'weapon5': '0.612', 'DAMAGECOUNT': '0.910', 'weapon4': '1.058', 'weapon3': '1.528'} +[2023-09-14 12:45:24,223][102046] DAMAGECOUNT value on done: 469.0 +[2023-09-14 12:45:24,224][102046] Sum rewards: 6.042, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.010', 'AMMO4': '0.049', 'AMMO3': '0.070', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon2': '0.464', 'weapon4': '0.516', 'WEAPON3': '0.600', 'weapon5': '1.124', 'weapon3': '1.562', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '3.240'} +[2023-09-14 12:45:24,224][102046] DAMAGECOUNT value on done: 550.0 +[2023-09-14 12:45:24,225][102046] Sum rewards: 3.015, reward structure: {'HEALTH': '-2.950', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.020', 'AMMO3': '0.064', 'AMMO4': '0.101', 'weapon2': '0.116', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'WEAPON3': '0.600', 'weapon5': '0.768', 'weapon4': '0.996', 'FRAGCOUNT': '1.000', 'weapon3': '1.784', 'DAMAGECOUNT': '1.900'} +[2023-09-14 12:45:24,515][102005] DAMAGECOUNT value on done: 195.0 +[2023-09-14 12:45:24,516][102005] DAMAGECOUNT value on done: 330.0 +[2023-09-14 12:45:24,516][102005] Sum rewards: 2.067, reward structure: {'HEALTH': '-2.200', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO2': '0.014', 'AMMO3': '0.059', 'AMMO4': '0.071', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon2': '0.424', 'weapon5': '0.462', 'WEAPON3': '0.500', 'weapon4': '0.634', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon3': '1.488'} +[2023-09-14 12:45:24,517][102005] Sum rewards: 5.602, reward structure: {'HEALTH': '-1.660', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.042', 'WEAPON5': '0.200', 'weapon2': '0.386', 'WEAPON3': '0.400', 'weapon5': '0.974', 'weapon3': '1.982', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.300'} +[2023-09-14 12:45:24,577][109198] Fps is (10 sec: 14745.6, 60 sec: 14404.3, 300 sec: 12577.2). Total num frames: 11153408. Throughput: 0: 1734.6, 1: 1798.8. Samples: 260794. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:45:24,579][109198] Avg episode reward: [(0, '4.327'), (1, '3.392')] +[2023-09-14 12:45:24,580][101718] Saving new best policy, reward=4.327! +[2023-09-14 12:45:24,756][102004] DAMAGECOUNT value on done: 432.0 +[2023-09-14 12:45:24,757][102004] DAMAGECOUNT value on done: 425.0 +[2023-09-14 12:45:24,757][102004] Sum rewards: 3.479, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.016', 'AMMO4': '0.081', 'AMMO3': '0.098', 'weapon5': '0.292', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon2': '0.514', 'weapon4': '0.588', 'WEAPON3': '0.800', 'FRAGCOUNT': '2.000', 'weapon3': '2.154', 'DAMAGECOUNT': '2.320'} +[2023-09-14 12:45:24,758][102004] Sum rewards: 6.782, reward structure: {'HEALTH': '-2.250', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.020', 'AMMO3': '0.064', 'AMMO4': '0.100', 'weapon2': '0.140', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon5': '0.584', 'WEAPON3': '0.600', 'weapon4': '0.982', 'weapon3': '1.882', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.150'} +[2023-09-14 12:45:25,101][102040] DAMAGECOUNT value on done: 580.0 +[2023-09-14 12:45:25,102][102040] DAMAGECOUNT value on done: 130.0 +[2023-09-14 12:45:25,102][102040] Sum rewards: 10.514, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.007', 'AMMO4': '0.024', 'AMMO3': '0.040', 'weapon2': '0.094', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.552', 'weapon5': '0.916', 'weapon3': '1.976', 'FRAGCOUNT': '3.999', 'DAMAGECOUNT': '4.100'} +[2023-09-14 12:45:25,120][102039] DAMAGECOUNT value on done: 545.0 +[2023-09-14 12:45:25,120][102039] DAMAGECOUNT value on done: 315.0 +[2023-09-14 12:45:25,120][102039] Sum rewards: 3.508, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.013', 'AMMO3': '0.046', 'AMMO4': '0.065', 'WEAPON5': '0.100', 'weapon5': '0.104', 'weapon2': '0.192', 'WEAPON4': '0.300', 'WEAPON3': '0.400', 'weapon4': '0.698', 'weapon3': '1.184', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.400'} +[2023-09-14 12:45:25,121][102039] Sum rewards: 4.461, reward structure: {'HEALTH': '-2.350', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.017', 'AMMO3': '0.070', 'AMMO4': '0.085', 'WEAPON5': '0.100', 'WEAPON4': '0.300', 'weapon2': '0.398', 'WEAPON3': '0.600', 'weapon5': '0.648', 'weapon4': '0.824', 'weapon3': '1.666', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.100'} +[2023-09-14 12:45:25,629][102040] DAMAGECOUNT value on done: 310.0 +[2023-09-14 12:45:25,630][102040] DAMAGECOUNT value on done: 205.0 +[2023-09-14 12:45:25,630][102040] Sum rewards: 4.671, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.015', 'AMMO3': '0.030', 'AMMO4': '0.075', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.476', 'weapon4': '0.564', 'weapon5': '0.574', 'weapon3': '0.932', 'DAMAGECOUNT': '1.400', 'FRAGCOUNT': '2.000'} +[2023-09-14 12:45:25,631][102040] Sum rewards: 2.645, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.013', 'AMMO2': '0.014', 'AMMO3': '0.058', 'AMMO4': '0.069', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon2': '0.456', 'WEAPON3': '0.500', 'weapon4': '0.592', 'weapon5': '0.904', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '1.490'} +[2023-09-14 12:45:25,645][102046] DAMAGECOUNT value on done: 140.0 +[2023-09-14 12:45:25,645][102046] DAMAGECOUNT value on done: 130.0 +[2023-09-14 12:45:25,693][102039] DAMAGECOUNT value on done: 390.0 +[2023-09-14 12:45:25,693][102039] DAMAGECOUNT value on done: 715.0 +[2023-09-14 12:45:25,694][102039] Sum rewards: 3.504, reward structure: {'HEALTH': '-2.500', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO2': '0.032', 'AMMO3': '0.066', 'AMMO4': '0.159', 'weapon2': '0.160', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon5': '0.344', 'WEAPON3': '0.600', 'weapon4': '0.610', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.900', 'weapon3': '2.620'} +[2023-09-14 12:45:25,694][102039] Sum rewards: 4.633, reward structure: {'HEALTH': '-1.900', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.304', 'weapon2': '0.360', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon5': '1.168', 'DAMAGECOUNT': '1.850', 'weapon3': '2.102'} +[2023-09-14 12:45:25,848][102003] DAMAGECOUNT value on done: 145.0 +[2023-09-14 12:45:25,848][102003] DAMAGECOUNT value on done: 150.0 +[2023-09-14 12:45:26,009][102001] DAMAGECOUNT value on done: 299.0 +[2023-09-14 12:45:26,009][102001] DAMAGECOUNT value on done: 266.0 +[2023-09-14 12:45:26,010][102001] Sum rewards: 4.172, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO4': '0.049', 'AMMO3': '0.060', 'WEAPON5': '0.100', 'weapon2': '0.130', 'weapon5': '0.138', 'WEAPON4': '0.300', 'WEAPON3': '0.600', 'weapon4': '0.774', 'weapon3': '1.956', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050'} +[2023-09-14 12:45:26,010][102001] Sum rewards: 4.567, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.015', 'AMMO4': '0.075', 'AMMO3': '0.075', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.422', 'weapon4': '0.588', 'WEAPON3': '0.600', 'weapon5': '0.896', 'weapon3': '1.388', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.100'} +[2023-09-14 12:45:26,172][102046] DAMAGECOUNT value on done: 433.0 +[2023-09-14 12:45:26,172][102046] DAMAGECOUNT value on done: 695.0 +[2023-09-14 12:45:26,172][102046] Sum rewards: 3.186, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.018', 'AMMO5': '0.020', 'AMMO4': '0.090', 'AMMO3': '0.109', 'WEAPON4': '0.200', 'weapon4': '0.222', 'weapon5': '0.270', 'WEAPON5': '0.400', 'weapon2': '0.504', 'WEAPON3': '0.800', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050', 'weapon3': '2.502'} +[2023-09-14 12:45:26,173][102046] Sum rewards: 7.011, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.015', 'AMMO3': '0.070', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'weapon4': '0.316', 'weapon2': '0.368', 'WEAPON3': '0.600', 'weapon5': '0.788', 'weapon3': '2.400', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.050'} +[2023-09-14 12:45:26,396][102003] DAMAGECOUNT value on done: 185.0 +[2023-09-14 12:45:26,396][102003] DAMAGECOUNT value on done: 150.0 +[2023-09-14 12:45:26,397][102003] Sum rewards: 4.528, reward structure: {'HEALTH': '-1.550', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO5': '0.009', 'AMMO4': '0.010', 'AMMO3': '0.040', 'weapon4': '0.096', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.796', 'weapon2': '0.946', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.450', 'weapon3': '2.030'} +[2023-09-14 12:45:26,555][102001] DAMAGECOUNT value on done: 270.0 +[2023-09-14 12:45:26,555][102001] DAMAGECOUNT value on done: 270.0 +[2023-09-14 12:45:26,555][102001] Sum rewards: 3.368, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.015', 'AMMO3': '0.030', 'AMMO4': '0.074', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon2': '0.246', 'WEAPON3': '0.300', 'weapon5': '0.424', 'weapon4': '0.652', 'FRAGCOUNT': '1.000', 'weapon3': '1.122', 'DAMAGECOUNT': '1.200'} +[2023-09-14 12:45:26,556][102001] Sum rewards: 4.566, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.020', 'AMMO3': '0.040', 'AMMO4': '0.097', 'WEAPON5': '0.100', 'weapon2': '0.128', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.584', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '1.324', 'weapon5': '1.768'} +[2023-09-14 12:45:26,679][101964] Updated weights for policy 1, policy_version 967 (0.0013) +[2023-09-14 12:45:26,778][102039] DAMAGECOUNT value on done: 165.0 +[2023-09-14 12:45:26,778][102039] DAMAGECOUNT value on done: 445.0 +[2023-09-14 12:45:26,779][102039] Sum rewards: 6.399, reward structure: {'HEALTH': '-0.350', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.708', 'weapon3': '0.892', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.350', 'weapon5': '2.474'} +[2023-09-14 12:45:26,966][101965] Updated weights for policy 0, policy_version 1765 (0.0013) +[2023-09-14 12:45:27,031][102003] DAMAGECOUNT value on done: 340.0 +[2023-09-14 12:45:27,032][102003] DAMAGECOUNT value on done: 264.0 +[2023-09-14 12:45:27,033][102003] Sum rewards: 2.733, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.013', 'AMMO2': '0.014', 'AMMO3': '0.063', 'AMMO4': '0.069', 'weapon2': '0.100', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.354', 'weapon5': '0.544', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.640', 'FRAGCOUNT': '0.998', 'weapon3': '2.838'} +[2023-09-14 12:45:27,376][102039] DAMAGECOUNT value on done: 186.0 +[2023-09-14 12:45:27,377][102039] Sum rewards: 2.780, reward structure: {'HEALTH': '-2.150', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO4': '0.009', 'AMMO5': '0.015', 'AMMO3': '0.071', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon2': '0.654', 'weapon5': '0.794', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '2.434'} +[2023-09-14 12:45:27,377][102039] DAMAGECOUNT value on done: 335.0 +[2023-09-14 12:45:27,378][102039] Sum rewards: 6.447, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.020', 'AMMO3': '0.041', 'AMMO4': '0.102', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.232', 'weapon2': '0.242', 'WEAPON3': '0.400', 'weapon4': '0.650', 'FRAGCOUNT': '2.000', 'weapon3': '2.000', 'DAMAGECOUNT': '2.350'} +[2023-09-14 12:45:27,851][102003] DAMAGECOUNT value on done: 393.0 +[2023-09-14 12:45:27,851][102003] DAMAGECOUNT value on done: 345.0 +[2023-09-14 12:45:27,852][102003] Sum rewards: 2.592, reward structure: {'HEALTH': '-3.600', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.025', 'AMMO3': '0.072', 'weapon5': '0.120', 'AMMO4': '0.123', 'WEAPON5': '0.200', 'weapon2': '0.286', 'WEAPON4': '0.400', 'WEAPON3': '0.600', 'weapon4': '0.864', 'weapon3': '1.764', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.730'} +[2023-09-14 12:45:27,852][102003] Sum rewards: 4.647, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.013', 'AMMO4': '0.063', 'AMMO3': '0.092', 'weapon5': '0.118', 'WEAPON5': '0.200', 'WEAPON4': '0.400', 'weapon2': '0.426', 'WEAPON3': '0.700', 'weapon4': '0.874', 'weapon3': '1.702', 'FRAGCOUNT': '2.999', 'DAMAGECOUNT': '3.050'} +[2023-09-14 12:45:27,932][102001] DAMAGECOUNT value on done: 345.0 +[2023-09-14 12:45:27,932][102001] DAMAGECOUNT value on done: 165.0 +[2023-09-14 12:45:27,933][102001] Sum rewards: 7.916, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.015', 'AMMO3': '0.040', 'weapon2': '0.040', 'AMMO4': '0.074', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.638', 'weapon4': '0.720', 'weapon3': '1.384', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.450'} +[2023-09-14 12:45:27,933][102001] Sum rewards: 1.359, reward structure: {'HEALTH': '-3.250', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.012', 'AMMO5': '0.015', 'AMMO4': '0.061', 'AMMO3': '0.084', 'weapon2': '0.100', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.344', 'weapon5': '0.536', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.250', 'weapon3': '3.006'} +[2023-09-14 12:45:28,606][102001] DAMAGECOUNT value on done: 165.0 +[2023-09-14 12:45:28,606][102001] DAMAGECOUNT value on done: 225.0 +[2023-09-14 12:45:28,607][102001] Sum rewards: 2.271, reward structure: {'HEALTH': '-1.500', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.043', 'AMMO2': '-0.009', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.250', 'WEAPON3': '0.400', 'weapon2': '0.690', 'weapon5': '1.454', 'weapon3': '1.780'} +[2023-09-14 12:45:29,578][109198] Fps is (10 sec: 15564.4, 60 sec: 14472.5, 300 sec: 12743.1). Total num frames: 11231232. Throughput: 0: 1695.1, 1: 1825.4. Samples: 282093. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:45:29,580][109198] Avg episode reward: [(0, '4.294'), (1, '3.546')] +[2023-09-14 12:45:32,432][101965] Updated weights for policy 0, policy_version 1775 (0.0012) +[2023-09-14 12:45:32,616][101964] Updated weights for policy 1, policy_version 977 (0.0011) +[2023-09-14 12:45:34,577][109198] Fps is (10 sec: 14745.6, 60 sec: 14336.0, 300 sec: 12805.4). Total num frames: 11300864. Throughput: 0: 1704.5, 1: 1839.1. Samples: 293268. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:45:34,579][109198] Avg episode reward: [(0, '4.294'), (1, '3.546')] +[2023-09-14 12:45:37,765][101965] Updated weights for policy 0, policy_version 1785 (0.0014) +[2023-09-14 12:45:38,429][101964] Updated weights for policy 1, policy_version 987 (0.0013) +[2023-09-14 12:45:39,577][109198] Fps is (10 sec: 13926.7, 60 sec: 14336.0, 300 sec: 12861.5). Total num frames: 11370496. Throughput: 0: 1723.7, 1: 1827.4. Samples: 315044. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:45:39,579][109198] Avg episode reward: [(0, '4.294'), (1, '3.546')] +[2023-09-14 12:45:43,236][101965] Updated weights for policy 0, policy_version 1795 (0.0014) +[2023-09-14 12:45:44,336][101964] Updated weights for policy 1, policy_version 997 (0.0013) +[2023-09-14 12:45:44,577][109198] Fps is (10 sec: 14336.0, 60 sec: 14336.0, 300 sec: 12951.2). Total num frames: 11444224. Throughput: 0: 1751.9, 1: 1807.8. Samples: 336801. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:45:44,579][109198] Avg episode reward: [(0, '4.294'), (1, '3.546')] +[2023-09-14 12:45:48,945][101965] Updated weights for policy 0, policy_version 1805 (0.0013) +[2023-09-14 12:45:49,577][109198] Fps is (10 sec: 14335.9, 60 sec: 14336.0, 300 sec: 12995.5). Total num frames: 11513856. Throughput: 0: 1772.0, 1: 1806.7. Samples: 347433. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:45:49,579][109198] Avg episode reward: [(0, '4.294'), (1, '3.546')] +[2023-09-14 12:45:49,583][101718] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001806_7397376.pth... +[2023-09-14 12:45:49,583][101802] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001005_4116480.pth... +[2023-09-14 12:45:49,654][101718] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001439_5894144.pth +[2023-09-14 12:45:49,675][101802] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000722_2957312.pth +[2023-09-14 12:45:50,625][101964] Updated weights for policy 1, policy_version 1007 (0.0013) +[2023-09-14 12:45:54,518][102037] DAMAGECOUNT value on done: 340.0 +[2023-09-14 12:45:54,518][102037] DAMAGECOUNT value on done: 537.0 +[2023-09-14 12:45:54,577][109198] Fps is (10 sec: 13516.8, 60 sec: 14199.5, 300 sec: 13000.4). Total num frames: 11579392. Throughput: 0: 1781.6, 1: 1767.1. Samples: 367503. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:45:54,579][109198] Avg episode reward: [(0, '4.294'), (1, '3.546')] +[2023-09-14 12:45:54,715][101965] Updated weights for policy 0, policy_version 1815 (0.0014) +[2023-09-14 12:45:55,140][102037] DAMAGECOUNT value on done: 581.0 +[2023-09-14 12:45:55,140][102037] DAMAGECOUNT value on done: 400.0 +[2023-09-14 12:45:55,141][102037] Sum rewards: 6.065, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.006', 'AMMO2': '0.029', 'AMMO3': '0.042', 'AMMO4': '0.144', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'WEAPON3': '0.400', 'weapon2': '0.428', 'weapon4': '0.764', 'weapon3': '1.220', 'weapon5': '1.322', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '3.210'} +[2023-09-14 12:45:55,141][102037] Sum rewards: 1.668, reward structure: {'HEALTH': '-2.810', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.001', 'AMMO4': '0.006', 'AMMO5': '0.015', 'AMMO3': '0.071', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'weapon4': '0.310', 'weapon2': '0.338', 'DAMAGECOUNT': '0.550', 'WEAPON3': '0.600', 'weapon5': '0.880', 'FRAGCOUNT': '1.000', 'weapon3': '2.306'} +[2023-09-14 12:45:55,271][102037] DAMAGECOUNT value on done: 400.0 +[2023-09-14 12:45:55,271][102037] DAMAGECOUNT value on done: 480.0 +[2023-09-14 12:45:55,272][102037] Sum rewards: 4.807, reward structure: {'HEALTH': '-1.300', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.011', 'AMMO3': '0.039', 'AMMO4': '0.056', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon2': '0.310', 'weapon4': '0.314', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.350', 'weapon5': '1.650', 'weapon3': '1.666'} +[2023-09-14 12:45:55,273][102037] Sum rewards: 4.769, reward structure: {'HEALTH': '-1.300', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.016', 'AMMO3': '0.034', 'AMMO4': '0.081', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon4': '0.222', 'WEAPON3': '0.300', 'weapon2': '0.350', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.350', 'weapon3': '1.364', 'weapon5': '2.046'} +[2023-09-14 12:45:55,916][102037] DAMAGECOUNT value on done: 470.0 +[2023-09-14 12:45:55,916][102037] DAMAGECOUNT value on done: 379.0 +[2023-09-14 12:45:56,746][101964] Updated weights for policy 1, policy_version 1017 (0.0012) +[2023-09-14 12:45:56,841][102005] DAMAGECOUNT value on done: 365.0 +[2023-09-14 12:45:56,842][102005] DAMAGECOUNT value on done: 292.0 +[2023-09-14 12:45:56,842][102005] Sum rewards: 4.747, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO4': '0.009', 'AMMO5': '0.009', 'AMMO3': '0.051', 'weapon4': '0.072', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.426', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.226', 'weapon5': '2.252'} +[2023-09-14 12:45:56,843][102005] Sum rewards: 2.465, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'weapon2': '0.016', 'AMMO3': '0.023', 'AMMO2': '0.033', 'WEAPON5': '0.100', 'weapon5': '0.134', 'AMMO4': '0.165', 'WEAPON3': '0.200', 'WEAPON4': '0.200', 'weapon3': '0.570', 'weapon4': '0.948', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.070'} +[2023-09-14 12:45:57,432][102005] DAMAGECOUNT value on done: 880.0 +[2023-09-14 12:45:57,432][102005] DAMAGECOUNT value on done: 595.0 +[2023-09-14 12:45:57,433][102005] Sum rewards: 2.367, reward structure: {'HEALTH': '-3.250', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.013', 'AMMO2': '0.025', 'AMMO3': '0.087', 'weapon5': '0.118', 'AMMO4': '0.124', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon2': '0.314', 'weapon4': '0.666', 'WEAPON3': '0.700', 'weapon3': '1.870', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.100'} +[2023-09-14 12:45:57,432][102005] Sum rewards: 5.370, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.020', 'weapon2': '0.040', 'AMMO3': '0.065', 'AMMO4': '0.101', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'WEAPON3': '0.600', 'weapon5': '0.742', 'weapon4': '1.004', 'weapon3': '1.688', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.600'} +[2023-09-14 12:45:57,796][102004] DAMAGECOUNT value on done: 355.0 +[2023-09-14 12:45:57,797][102004] DAMAGECOUNT value on done: 289.0 +[2023-09-14 12:45:57,797][102004] Sum rewards: 5.619, reward structure: {'HEALTH': '-0.950', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.346', 'FRAGCOUNT': '1.000', 'weapon3': '1.044', 'DAMAGECOUNT': '1.100', 'weapon5': '2.724'} +[2023-09-14 12:45:58,301][102004] DAMAGECOUNT value on done: 315.0 +[2023-09-14 12:45:58,302][102004] DAMAGECOUNT value on done: 620.0 +[2023-09-14 12:45:58,302][102004] Sum rewards: 2.827, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.001', 'AMMO4': '0.007', 'AMMO5': '0.010', 'AMMO3': '0.058', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon2': '0.282', 'WEAPON3': '0.500', 'weapon4': '0.548', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon5': '1.302', 'weapon3': '1.668'} +[2023-09-14 12:45:58,303][102004] Sum rewards: 6.422, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.338', 'weapon2': '0.344', 'WEAPON3': '0.400', 'weapon5': '1.142', 'weapon3': '1.748', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.100'} +[2023-09-14 12:45:58,375][102040] DAMAGECOUNT value on done: 365.0 +[2023-09-14 12:45:58,376][102040] DAMAGECOUNT value on done: 585.0 +[2023-09-14 12:45:58,376][102040] Sum rewards: 4.476, reward structure: {'HEALTH': '-1.550', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.055', 'WEAPON5': '0.100', 'weapon2': '0.344', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon3': '1.230', 'DAMAGECOUNT': '1.400', 'weapon5': '2.522'} +[2023-09-14 12:45:58,376][102040] Sum rewards: 3.206, reward structure: {'HEALTH': '-1.870', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.020', 'AMMO3': '0.047', 'weapon2': '0.058', 'AMMO4': '0.099', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.560', 'weapon4': '0.806', 'FRAGCOUNT': '1.000', 'weapon3': '1.078', 'DAMAGECOUNT': '1.600'} +[2023-09-14 12:45:58,921][102040] DAMAGECOUNT value on done: 447.0 +[2023-09-14 12:45:58,922][102040] DAMAGECOUNT value on done: 213.0 +[2023-09-14 12:45:59,577][109198] Fps is (10 sec: 13516.9, 60 sec: 14199.5, 300 sec: 13039.0). Total num frames: 11649024. Throughput: 0: 1798.7, 1: 1738.6. Samples: 388210. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:45:59,579][109198] Avg episode reward: [(0, '4.284'), (1, '3.598')] +[2023-09-14 12:46:00,320][101965] Updated weights for policy 0, policy_version 1825 (0.0012) +[2023-09-14 12:46:00,793][102005] DAMAGECOUNT value on done: 490.0 +[2023-09-14 12:46:00,793][102005] DAMAGECOUNT value on done: 324.0 +[2023-09-14 12:46:00,794][102005] Sum rewards: 3.892, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.020', 'AMMO3': '0.029', 'AMMO4': '0.100', 'WEAPON5': '0.100', 'weapon2': '0.118', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon5': '0.370', 'weapon4': '0.784', 'FRAGCOUNT': '0.999', 'weapon3': '1.068', 'DAMAGECOUNT': '1.800'} +[2023-09-14 12:46:00,794][102005] Sum rewards: 0.862, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.011', 'AMMO4': '0.053', 'AMMO3': '0.077', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.242', 'WEAPON3': '0.600', 'weapon2': '0.658', 'weapon5': '1.372', 'weapon3': '1.440'} +[2023-09-14 12:46:01,381][102005] DAMAGECOUNT value on done: 510.0 +[2023-09-14 12:46:01,381][102005] DAMAGECOUNT value on done: 590.0 +[2023-09-14 12:46:01,382][102005] Sum rewards: 6.511, reward structure: {'HEALTH': '-2.500', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.015', 'AMMO3': '0.072', 'weapon2': '0.110', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.434', 'WEAPON3': '0.600', 'weapon5': '1.002', 'weapon3': '2.128', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.150'} +[2023-09-14 12:46:01,382][102005] Sum rewards: 3.988, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.031', 'AMMO3': '0.068', 'AMMO4': '0.153', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon2': '0.332', 'weapon4': '0.390', 'WEAPON3': '0.600', 'weapon5': '0.782', 'FRAGCOUNT': '2.000', 'weapon3': '2.416', 'DAMAGECOUNT': '2.600'} +[2023-09-14 12:46:01,413][102004] DAMAGECOUNT value on done: 597.0 +[2023-09-14 12:46:01,413][102004] DAMAGECOUNT value on done: 481.0 +[2023-09-14 12:46:01,414][102004] Sum rewards: 3.892, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'weapon2': '0.002', 'AMMO5': '0.015', 'AMMO3': '0.065', 'WEAPON4': '0.100', 'weapon4': '0.232', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon5': '1.204', 'DAMAGECOUNT': '1.850', 'weapon3': '2.524'} +[2023-09-14 12:46:01,414][102004] Sum rewards: 6.042, reward structure: {'HEALTH': '-1.850', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.010', 'weapon2': '0.016', 'AMMO4': '0.024', 'AMMO3': '0.053', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.314', 'WEAPON3': '0.400', 'weapon3': '1.142', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.150', 'weapon5': '2.478'} +[2023-09-14 12:46:01,965][102004] DAMAGECOUNT value on done: 637.0 +[2023-09-14 12:46:01,965][102004] DAMAGECOUNT value on done: 530.0 +[2023-09-14 12:46:01,966][102004] Sum rewards: 5.831, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.015', 'AMMO3': '0.043', 'weapon2': '0.066', 'AMMO4': '0.074', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.698', 'weapon5': '0.938', 'weapon3': '1.242', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050'} +[2023-09-14 12:46:01,966][102004] Sum rewards: 2.574, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.011', 'AMMO5': '0.015', 'AMMO4': '0.055', 'AMMO3': '0.060', 'WEAPON4': '0.100', 'weapon4': '0.172', 'WEAPON5': '0.300', 'WEAPON3': '0.500', 'weapon2': '0.746', 'weapon5': '0.788', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '1.776'} +[2023-09-14 12:46:02,694][102040] DAMAGECOUNT value on done: 665.0 +[2023-09-14 12:46:02,694][102040] DAMAGECOUNT value on done: 270.0 +[2023-09-14 12:46:02,695][102040] Sum rewards: 0.711, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.036', 'AMMO3': '0.039', 'WEAPON5': '0.100', 'AMMO4': '0.179', 'WEAPON4': '0.300', 'WEAPON3': '0.300', 'weapon2': '0.410', 'weapon3': '0.604', 'weapon4': '0.644', 'DAMAGECOUNT': '0.850', 'weapon5': '1.248'} +[2023-09-14 12:46:02,695][102040] Sum rewards: 4.617, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.015', 'AMMO3': '0.045', 'AMMO4': '0.074', 'weapon2': '0.130', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.664', 'FRAGCOUNT': '0.999', 'weapon3': '1.038', 'DAMAGECOUNT': '1.400', 'weapon5': '1.492'} +[2023-09-14 12:46:02,728][101964] Updated weights for policy 1, policy_version 1027 (0.0012) +[2023-09-14 12:46:03,064][102046] DAMAGECOUNT value on done: 470.0 +[2023-09-14 12:46:03,065][102046] DAMAGECOUNT value on done: 475.0 +[2023-09-14 12:46:03,065][102046] Sum rewards: 1.233, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.024', 'AMMO3': '0.076', 'weapon2': '0.102', 'AMMO4': '0.118', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'WEAPON3': '0.600', 'weapon4': '0.716', 'weapon5': '0.920', 'FRAGCOUNT': '0.999', 'weapon3': '1.518', 'DAMAGECOUNT': '1.650'} +[2023-09-14 12:46:03,066][102046] Sum rewards: 5.910, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO2': '0.021', 'AMMO3': '0.060', 'AMMO4': '0.105', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon2': '0.348', 'weapon5': '0.406', 'weapon4': '0.488', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.550', 'weapon3': '2.718'} +[2023-09-14 12:46:03,114][102039] DAMAGECOUNT value on done: 369.0 +[2023-09-14 12:46:03,114][102039] DAMAGECOUNT value on done: 545.0 +[2023-09-14 12:46:03,208][102040] DAMAGECOUNT value on done: 305.0 +[2023-09-14 12:46:03,208][102040] DAMAGECOUNT value on done: 385.0 +[2023-09-14 12:46:03,209][102040] Sum rewards: 5.647, reward structure: {'HEALTH': '-0.750', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.708', 'weapon3': '0.780', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.000', 'weapon5': '2.584'} +[2023-09-14 12:46:03,593][102046] DAMAGECOUNT value on done: 509.0 +[2023-09-14 12:46:03,593][102046] DAMAGECOUNT value on done: 670.0 +[2023-09-14 12:46:03,594][102046] Sum rewards: 1.131, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.006', 'AMMO2': '0.015', 'AMMO3': '0.053', 'AMMO4': '0.075', 'weapon2': '0.172', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.400', 'WEAPON3': '0.500', 'weapon4': '0.878', 'weapon5': '0.996', 'weapon3': '1.536'} +[2023-09-14 12:46:03,594][102046] Sum rewards: 4.512, reward structure: {'HEALTH': '-0.400', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.015', 'AMMO3': '0.019', 'AMMO4': '0.075', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.206', 'weapon4': '0.436', 'weapon3': '0.650', 'weapon5': '0.908', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.200'} +[2023-09-14 12:46:03,668][102039] DAMAGECOUNT value on done: 510.0 +[2023-09-14 12:46:03,669][102039] DAMAGECOUNT value on done: 1072.0 +[2023-09-14 12:46:03,669][102039] Sum rewards: 0.034, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.013', 'AMMO4': '0.067', 'AMMO3': '0.080', 'weapon2': '0.168', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon4': '0.516', 'WEAPON3': '0.700', 'weapon5': '0.774', 'DAMAGECOUNT': '1.200', 'weapon3': '2.008'} +[2023-09-14 12:46:03,670][102039] Sum rewards: 5.488, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.006', 'AMMO2': '0.028', 'AMMO3': '0.072', 'AMMO4': '0.140', 'weapon2': '0.146', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'WEAPON3': '0.600', 'weapon5': '0.766', 'FRAGCOUNT': '0.999', 'weapon4': '1.024', 'weapon3': '1.636', 'DAMAGECOUNT': '3.570'} +[2023-09-14 12:46:04,577][109198] Fps is (10 sec: 14336.0, 60 sec: 14267.7, 300 sec: 13107.2). Total num frames: 11722752. Throughput: 0: 1815.7, 1: 1729.0. Samples: 398942. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:46:04,579][109198] Avg episode reward: [(0, '4.321'), (1, '3.491')] +[2023-09-14 12:46:04,894][102039] DAMAGECOUNT value on done: 635.0 +[2023-09-14 12:46:04,895][102039] DAMAGECOUNT value on done: 275.0 +[2023-09-14 12:46:04,895][102039] Sum rewards: 5.564, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.039', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.314', 'weapon2': '0.356', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon5': '1.588', 'weapon3': '1.656', 'DAMAGECOUNT': '1.900'} +[2023-09-14 12:46:04,896][102039] Sum rewards: 2.239, reward structure: {'HEALTH': '-2.100', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.037', 'AMMO3': '0.059', 'WEAPON5': '0.100', 'AMMO4': '0.184', 'weapon2': '0.214', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'weapon5': '0.572', 'weapon4': '0.812', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.100', 'weapon3': '1.458'} +[2023-09-14 12:46:04,954][102003] DAMAGECOUNT value on done: 260.0 +[2023-09-14 12:46:04,954][102003] DAMAGECOUNT value on done: 270.0 +[2023-09-14 12:46:04,955][102003] Sum rewards: 3.048, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.022', 'AMMO3': '0.060', 'weapon2': '0.104', 'AMMO4': '0.111', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'weapon4': '0.802', 'FRAGCOUNT': '0.999', 'weapon5': '1.056', 'DAMAGECOUNT': '1.100', 'weapon3': '1.786'} +[2023-09-14 12:46:04,955][102003] Sum rewards: 4.804, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.704', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.250', 'weapon3': '1.572', 'weapon5': '1.738'} +[2023-09-14 12:46:05,044][102046] DAMAGECOUNT value on done: 290.0 +[2023-09-14 12:46:05,045][102046] DAMAGECOUNT value on done: 230.0 +[2023-09-14 12:46:05,045][102046] Sum rewards: 5.125, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.010', 'AMMO3': '0.030', 'AMMO4': '0.049', 'WEAPON5': '0.100', 'weapon2': '0.132', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon4': '0.600', 'FRAGCOUNT': '0.999', 'weapon3': '1.082', 'DAMAGECOUNT': '1.600', 'weapon5': '2.020'} +[2023-09-14 12:46:05,046][102046] Sum rewards: 1.463, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.023', 'AMMO3': '0.074', 'AMMO4': '0.115', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon5': '0.368', 'weapon4': '0.456', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.900', 'weapon2': '1.156', 'weapon3': '1.364'} +[2023-09-14 12:46:05,446][102039] DAMAGECOUNT value on done: 625.0 +[2023-09-14 12:46:05,446][102039] DAMAGECOUNT value on done: 543.0 +[2023-09-14 12:46:05,447][102039] Sum rewards: 3.663, reward structure: {'HEALTH': '-2.650', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.013', 'AMMO3': '0.060', 'AMMO4': '0.067', 'WEAPON5': '0.100', 'WEAPON4': '0.300', 'weapon2': '0.378', 'weapon5': '0.426', 'WEAPON3': '0.600', 'weapon4': '0.690', 'FRAGCOUNT': '1.000', 'weapon3': '1.776', 'DAMAGECOUNT': '2.900'} +[2023-09-14 12:46:05,447][102039] Sum rewards: 4.829, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.011', 'AMMO2': '0.019', 'AMMO3': '0.089', 'AMMO4': '0.095', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon2': '0.350', 'weapon5': '0.664', 'WEAPON3': '0.700', 'weapon4': '0.990', 'weapon3': '1.742', 'FRAGCOUNT': '1.998', 'DAMAGECOUNT': '3.570'} +[2023-09-14 12:46:05,634][102003] DAMAGECOUNT value on done: 190.0 +[2023-09-14 12:46:05,634][102003] DAMAGECOUNT value on done: 320.0 +[2023-09-14 12:46:05,635][102003] Sum rewards: 5.523, reward structure: {'HEALTH': '-0.080', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'AMMO2': '0.025', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.125', 'WEAPON3': '0.200', 'weapon2': '0.410', 'weapon5': '0.614', 'weapon4': '0.622', 'weapon3': '0.684', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.700'} +[2023-09-14 12:46:05,679][101965] Updated weights for policy 0, policy_version 1835 (0.0013) +[2023-09-14 12:46:05,768][102046] DAMAGECOUNT value on done: 710.0 +[2023-09-14 12:46:05,768][102046] DAMAGECOUNT value on done: 493.0 +[2023-09-14 12:46:05,768][102046] Sum rewards: 3.178, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.003', 'AMMO5': '0.010', 'AMMO4': '0.016', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'weapon4': '0.196', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.476', 'DAMAGECOUNT': '0.600', 'weapon5': '1.386', 'weapon3': '1.752'} +[2023-09-14 12:46:05,786][102001] DAMAGECOUNT value on done: 299.0 +[2023-09-14 12:46:05,786][102001] DAMAGECOUNT value on done: 331.0 +[2023-09-14 12:46:06,268][102003] DAMAGECOUNT value on done: 485.0 +[2023-09-14 12:46:06,268][102003] DAMAGECOUNT value on done: 553.0 +[2023-09-14 12:46:06,268][102003] Sum rewards: 4.149, reward structure: {'HEALTH': '-2.080', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.015', 'AMMO4': '0.074', 'AMMO3': '0.075', 'weapon2': '0.148', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.358', 'WEAPON3': '0.600', 'weapon4': '0.668', 'weapon3': '1.674', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.210'} +[2023-09-14 12:46:06,269][102003] Sum rewards: 5.023, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO4': '0.011', 'AMMO5': '0.015', 'AMMO3': '0.066', 'WEAPON4': '0.200', 'weapon2': '0.230', 'WEAPON5': '0.300', 'weapon5': '0.390', 'weapon4': '0.522', 'WEAPON3': '0.600', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.130', 'weapon3': '2.556'} +[2023-09-14 12:46:06,427][102001] DAMAGECOUNT value on done: 395.0 +[2023-09-14 12:46:06,427][102001] DAMAGECOUNT value on done: 385.0 +[2023-09-14 12:46:06,428][102001] Sum rewards: 3.153, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.026', 'AMMO3': '0.037', 'WEAPON5': '0.100', 'AMMO4': '0.129', 'weapon2': '0.130', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon5': '0.676', 'weapon3': '0.720', 'weapon4': '0.732', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.250'} +[2023-09-14 12:46:06,428][102001] Sum rewards: 4.796, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.014', 'AMMO3': '0.040', 'weapon2': '0.068', 'AMMO4': '0.071', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.560', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150', 'weapon5': '1.494', 'weapon3': '1.688'} +[2023-09-14 12:46:06,915][102003] DAMAGECOUNT value on done: 598.0 +[2023-09-14 12:46:06,915][102003] DAMAGECOUNT value on done: 400.0 +[2023-09-14 12:46:06,916][102003] Sum rewards: 6.620, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.724', 'weapon5': '1.608', 'weapon3': '1.650', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.050'} +[2023-09-14 12:46:07,777][102001] DAMAGECOUNT value on done: 563.0 +[2023-09-14 12:46:07,778][102001] DAMAGECOUNT value on done: 215.0 +[2023-09-14 12:46:07,778][102001] Sum rewards: 6.344, reward structure: {'HEALTH': '-1.250', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.007', 'AMMO5': '0.007', 'AMMO4': '0.035', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.342', 'WEAPON3': '0.400', 'weapon2': '0.610', 'weapon5': '1.174', 'weapon3': '1.498', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.180'} +[2023-09-14 12:46:07,779][102001] Sum rewards: 2.635, reward structure: {'HEALTH': '-2.150', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.025', 'AMMO3': '0.081', 'AMMO4': '0.123', 'weapon4': '0.150', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.500', 'WEAPON3': '0.600', 'weapon2': '0.706', 'FRAGCOUNT': '1.000', 'weapon5': '1.256', 'weapon3': '1.828'} +[2023-09-14 12:46:08,529][102001] DAMAGECOUNT value on done: 270.0 +[2023-09-14 12:46:08,529][102001] DAMAGECOUNT value on done: 305.0 +[2023-09-14 12:46:08,530][102001] Sum rewards: 4.068, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.010', 'AMMO3': '0.044', 'AMMO4': '0.050', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.618', 'FRAGCOUNT': '0.999', 'weapon3': '1.072', 'weapon5': '1.172', 'DAMAGECOUNT': '1.400'} +[2023-09-14 12:46:08,800][101964] Updated weights for policy 1, policy_version 1037 (0.0013) +[2023-09-14 12:46:09,577][109198] Fps is (10 sec: 14336.0, 60 sec: 14267.7, 300 sec: 13138.7). Total num frames: 11792384. Throughput: 0: 1844.8, 1: 1704.6. Samples: 420519. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:46:09,579][109198] Avg episode reward: [(0, '4.320'), (1, '3.487')] +[2023-09-14 12:46:11,328][101965] Updated weights for policy 0, policy_version 1845 (0.0015) +[2023-09-14 12:46:14,577][109198] Fps is (10 sec: 14336.1, 60 sec: 14336.0, 300 sec: 13198.2). Total num frames: 11866112. Throughput: 0: 1852.7, 1: 1704.5. Samples: 442166. Policy #0 lag: (min: 0.0, avg: 0.4, max: 2.0) +[2023-09-14 12:46:14,579][109198] Avg episode reward: [(0, '4.320'), (1, '3.487')] +[2023-09-14 12:46:14,945][101964] Updated weights for policy 1, policy_version 1047 (0.0013) +[2023-09-14 12:46:16,807][101965] Updated weights for policy 0, policy_version 1855 (0.0014) +[2023-09-14 12:46:19,577][109198] Fps is (10 sec: 14336.1, 60 sec: 14336.0, 300 sec: 13224.3). Total num frames: 11935744. Throughput: 0: 1847.1, 1: 1694.0. Samples: 452617. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:46:19,579][109198] Avg episode reward: [(0, '4.320'), (1, '3.487')] +[2023-09-14 12:46:20,880][101964] Updated weights for policy 1, policy_version 1057 (0.0012) +[2023-09-14 12:46:22,412][101965] Updated weights for policy 0, policy_version 1865 (0.0016) +[2023-09-14 12:46:24,577][109198] Fps is (10 sec: 13516.7, 60 sec: 14131.2, 300 sec: 13220.2). Total num frames: 12001280. Throughput: 0: 1833.4, 1: 1684.3. Samples: 473341. Policy #0 lag: (min: 0.0, avg: 0.6, max: 3.0) +[2023-09-14 12:46:24,579][109198] Avg episode reward: [(0, '4.320'), (1, '3.487')] +[2023-09-14 12:46:27,205][101964] Updated weights for policy 1, policy_version 1067 (0.0013) +[2023-09-14 12:46:28,092][101965] Updated weights for policy 0, policy_version 1875 (0.0013) +[2023-09-14 12:46:29,577][109198] Fps is (10 sec: 13516.7, 60 sec: 13994.7, 300 sec: 13243.7). Total num frames: 12070912. Throughput: 0: 1824.8, 1: 1672.8. Samples: 494192. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:46:29,579][109198] Avg episode reward: [(0, '4.320'), (1, '3.487')] +[2023-09-14 12:46:31,081][102004] DAMAGECOUNT value on done: 494.0 +[2023-09-14 12:46:31,082][102004] DAMAGECOUNT value on done: 821.0 +[2023-09-14 12:46:31,083][102004] Sum rewards: 6.784, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'weapon2': '0.006', 'AMMO5': '0.013', 'AMMO4': '0.025', 'AMMO3': '0.080', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon5': '0.340', 'WEAPON3': '0.700', 'weapon4': '0.754', 'weapon3': '2.602', 'FRAGCOUNT': '2.999', 'DAMAGECOUNT': '4.660'} +[2023-09-14 12:46:31,082][102004] Sum rewards: 2.803, reward structure: {'HEALTH': '-3.700', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.016', 'AMMO5': '0.020', 'AMMO4': '0.079', 'AMMO3': '0.089', 'weapon2': '0.124', 'WEAPON4': '0.200', 'weapon5': '0.240', 'WEAPON5': '0.400', 'weapon4': '0.512', 'WEAPON3': '0.800', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050', 'weapon3': '2.972'} +[2023-09-14 12:46:31,656][102004] DAMAGECOUNT value on done: 690.0 +[2023-09-14 12:46:31,656][102004] DAMAGECOUNT value on done: 435.0 +[2023-09-14 12:46:31,657][102004] Sum rewards: 5.863, reward structure: {'HEALTH': '-0.700', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.398', 'weapon3': '0.724', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.200', 'weapon5': '2.946'} +[2023-09-14 12:46:31,686][102037] DAMAGECOUNT value on done: 746.0 +[2023-09-14 12:46:31,686][102037] DAMAGECOUNT value on done: 515.0 +[2023-09-14 12:46:31,687][102037] Sum rewards: 4.575, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'weapon2': '0.004', 'AMMO5': '0.007', 'AMMO2': '0.024', 'AMMO3': '0.059', 'AMMO4': '0.120', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'weapon4': '0.564', 'weapon5': '1.102', 'weapon3': '1.604', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.090'} +[2023-09-14 12:46:31,687][102037] Sum rewards: 5.097, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.028', 'AMMO3': '0.068', 'AMMO4': '0.139', 'weapon2': '0.144', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.480', 'WEAPON3': '0.600', 'weapon5': '1.330', 'DAMAGECOUNT': '1.750', 'FRAGCOUNT': '2.000', 'weapon3': '2.042'} +[2023-09-14 12:46:32,297][102037] DAMAGECOUNT value on done: 696.0 +[2023-09-14 12:46:32,298][102037] DAMAGECOUNT value on done: 565.0 +[2023-09-14 12:46:32,298][102037] Sum rewards: 1.103, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.027', 'AMMO3': '0.052', 'WEAPON5': '0.100', 'AMMO4': '0.132', 'weapon2': '0.162', 'WEAPON4': '0.300', 'WEAPON3': '0.400', 'weapon4': '0.898', 'weapon5': '0.908', 'weapon3': '0.970', 'DAMAGECOUNT': '1.150'} +[2023-09-14 12:46:32,298][102037] Sum rewards: 5.079, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.015', 'AMMO2': '-0.003', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.938', 'FRAGCOUNT': '0.999', 'weapon5': '1.318', 'DAMAGECOUNT': '1.650', 'weapon3': '1.742'} +[2023-09-14 12:46:32,489][102037] DAMAGECOUNT value on done: 900.0 +[2023-09-14 12:46:32,489][102037] DAMAGECOUNT value on done: 800.0 +[2023-09-14 12:46:32,490][102037] Sum rewards: 6.715, reward structure: {'HEALTH': '-3.800', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.010', 'AMMO5': '0.015', 'AMMO4': '0.048', 'AMMO3': '0.099', 'WEAPON4': '0.200', 'weapon5': '0.256', 'WEAPON5': '0.300', 'weapon4': '0.304', 'weapon2': '0.578', 'WEAPON3': '0.800', 'weapon3': '2.704', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.200'} +[2023-09-14 12:46:32,490][102037] Sum rewards: 4.739, reward structure: {'HEALTH': '-4.000', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.020', 'weapon2': '0.068', 'AMMO4': '0.100', 'AMMO3': '0.119', 'WEAPON5': '0.400', 'WEAPON4': '0.400', 'weapon5': '0.522', 'weapon4': '0.694', 'WEAPON3': '0.900', 'weapon3': '2.496', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '4.000'} +[2023-09-14 12:46:33,040][102037] DAMAGECOUNT value on done: 575.0 +[2023-09-14 12:46:33,041][102037] DAMAGECOUNT value on done: 584.0 +[2023-09-14 12:46:33,041][102037] Sum rewards: 2.704, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.055', 'WEAPON5': '0.200', 'WEAPON3': '0.500', 'weapon2': '0.726', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon5': '1.442', 'weapon3': '1.780'} +[2023-09-14 12:46:33,041][102037] Sum rewards: 5.838, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.025', 'AMMO3': '0.042', 'weapon5': '0.056', 'WEAPON5': '0.100', 'AMMO4': '0.125', 'WEAPON4': '0.200', 'weapon2': '0.370', 'WEAPON3': '0.400', 'weapon4': '1.018', 'weapon3': '1.446', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050'} +[2023-09-14 12:46:33,189][101964] Updated weights for policy 1, policy_version 1077 (0.0012) +[2023-09-14 12:46:33,454][101965] Updated weights for policy 0, policy_version 1885 (0.0012) +[2023-09-14 12:46:33,897][102005] DAMAGECOUNT value on done: 322.0 +[2023-09-14 12:46:33,897][102005] DAMAGECOUNT value on done: 430.0 +[2023-09-14 12:46:34,486][102005] DAMAGECOUNT value on done: 1033.0 +[2023-09-14 12:46:34,486][102005] DAMAGECOUNT value on done: 710.0 +[2023-09-14 12:46:34,487][102005] Sum rewards: 3.055, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.015', 'AMMO3': '0.020', 'AMMO4': '0.075', 'weapon2': '0.094', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'WEAPON4': '0.200', 'weapon5': '0.554', 'weapon3': '0.700', 'weapon4': '0.714', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.530'} +[2023-09-14 12:46:34,487][102005] Sum rewards: 3.939, reward structure: {'HEALTH': '-1.530', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.011', 'AMMO3': '0.040', 'AMMO4': '0.056', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.400', 'weapon4': '0.516', 'weapon2': '0.798', 'weapon5': '0.940', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150', 'weapon3': '1.352'} +[2023-09-14 12:46:34,579][109198] Fps is (10 sec: 14743.1, 60 sec: 14130.8, 300 sec: 13318.5). Total num frames: 12148736. Throughput: 0: 1830.6, 1: 1676.7. Samples: 505268. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:46:34,581][109198] Avg episode reward: [(0, '4.338'), (1, '3.478')] +[2023-09-14 12:46:34,582][101718] Saving new best policy, reward=4.338! +[2023-09-14 12:46:35,619][102040] DAMAGECOUNT value on done: 695.0 +[2023-09-14 12:46:35,619][102040] DAMAGECOUNT value on done: 660.0 +[2023-09-14 12:46:35,620][102040] Sum rewards: 0.749, reward structure: {'HEALTH': '-2.800', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.014', 'AMMO3': '0.050', 'AMMO4': '0.071', 'weapon5': '0.076', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon2': '0.306', 'weapon4': '0.452', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon3': '1.674'} +[2023-09-14 12:46:35,620][102040] Sum rewards: 5.108, reward structure: {'HEALTH': '-2.790', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.009', 'AMMO5': '0.012', 'AMMO4': '0.046', 'AMMO3': '0.060', 'weapon2': '0.110', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon4': '0.606', 'weapon5': '0.910', 'FRAGCOUNT': '1.999', 'weapon3': '2.096', 'DAMAGECOUNT': '2.950'} +[2023-09-14 12:46:36,156][102040] DAMAGECOUNT value on done: 213.0 +[2023-09-14 12:46:36,156][102040] DAMAGECOUNT value on done: 472.0 +[2023-09-14 12:46:38,065][102005] DAMAGECOUNT value on done: 610.0 +[2023-09-14 12:46:38,066][102005] Sum rewards: 3.000, reward structure: {'HEALTH': '-1.600', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.015', 'weapon5': '0.016', 'AMMO3': '0.045', 'AMMO4': '0.075', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.594', 'weapon4': '0.622', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.200', 'weapon3': '1.328'} +[2023-09-14 12:46:38,066][102005] DAMAGECOUNT value on done: 489.0 +[2023-09-14 12:46:38,067][102005] Sum rewards: 4.730, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.010', 'AMMO3': '0.043', 'AMMO4': '0.050', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.510', 'weapon4': '0.518', 'FRAGCOUNT': '1.000', 'weapon5': '1.020', 'weapon3': '1.318', 'DAMAGECOUNT': '1.650'} +[2023-09-14 12:46:38,119][102004] DAMAGECOUNT value on done: 947.0 +[2023-09-14 12:46:38,120][102004] DAMAGECOUNT value on done: 586.0 +[2023-09-14 12:46:38,120][102004] Sum rewards: 8.179, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.007', 'AMMO4': '0.026', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.364', 'WEAPON3': '0.400', 'weapon5': '0.494', 'weapon2': '0.566', 'weapon3': '1.476', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.500'} +[2023-09-14 12:46:38,121][102004] Sum rewards: 1.345, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.006', 'AMMO5': '0.015', 'AMMO4': '0.030', 'AMMO3': '0.086', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.370', 'weapon2': '0.448', 'WEAPON3': '0.700', 'weapon5': '0.962', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '2.178'} +[2023-09-14 12:46:38,600][102005] DAMAGECOUNT value on done: 725.0 +[2023-09-14 12:46:38,601][102005] DAMAGECOUNT value on done: 865.0 +[2023-09-14 12:46:38,601][102005] Sum rewards: 4.719, reward structure: {'HEALTH': '-2.650', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.027', 'AMMO3': '0.062', 'AMMO4': '0.135', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon2': '0.354', 'weapon4': '0.402', 'WEAPON3': '0.600', 'weapon5': '0.704', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.150', 'weapon3': '2.420'} +[2023-09-14 12:46:38,602][102005] Sum rewards: 5.886, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.017', 'AMMO3': '0.076', 'AMMO4': '0.085', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon2': '0.380', 'weapon4': '0.396', 'WEAPON3': '0.600', 'weapon5': '1.302', 'weapon3': '1.764', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.750'} +[2023-09-14 12:46:38,771][102004] DAMAGECOUNT value on done: 679.0 +[2023-09-14 12:46:38,772][102004] DAMAGECOUNT value on done: 635.0 +[2023-09-14 12:46:38,772][102004] Sum rewards: 5.997, reward structure: {'HEALTH': '-0.420', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.356', 'weapon3': '0.818', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon5': '2.898'} +[2023-09-14 12:46:38,951][101965] Updated weights for policy 0, policy_version 1895 (0.0016) +[2023-09-14 12:46:39,071][101964] Updated weights for policy 1, policy_version 1087 (0.0012) +[2023-09-14 12:46:39,577][109198] Fps is (10 sec: 14745.8, 60 sec: 14131.2, 300 sec: 13337.6). Total num frames: 12218368. Throughput: 0: 1846.3, 1: 1690.5. Samples: 526661. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:46:39,579][109198] Avg episode reward: [(0, '4.365'), (1, '3.470')] +[2023-09-14 12:46:39,585][101718] Saving new best policy, reward=4.365! +[2023-09-14 12:46:39,892][102040] DAMAGECOUNT value on done: 815.0 +[2023-09-14 12:46:39,892][102040] DAMAGECOUNT value on done: 365.0 +[2023-09-14 12:46:39,892][102040] Sum rewards: 4.194, reward structure: {'HEALTH': '-1.350', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.015', 'AMMO3': '0.040', 'AMMO4': '0.075', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.298', 'WEAPON3': '0.400', 'weapon4': '0.598', 'weapon2': '0.710', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.500', 'weapon3': '1.500'} +[2023-09-14 12:46:39,893][102040] Sum rewards: 0.915, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.014', 'AMMO4': '0.071', 'AMMO3': '0.074', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.500', 'weapon5': '0.522', 'weapon4': '0.536', 'weapon2': '0.926', 'DAMAGECOUNT': '0.950', 'weapon3': '1.018'} +[2023-09-14 12:46:40,436][102040] DAMAGECOUNT value on done: 595.0 +[2023-09-14 12:46:40,436][102040] DAMAGECOUNT value on done: 545.0 +[2023-09-14 12:46:40,437][102040] Sum rewards: 7.165, reward structure: {'HEALTH': '-1.550', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.012', 'AMMO3': '0.040', 'weapon4': '0.050', 'AMMO4': '0.059', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.550', 'weapon3': '1.582', 'weapon5': '1.812', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.900'} +[2023-09-14 12:46:40,437][102040] Sum rewards: 2.861, reward structure: {'HEALTH': '-2.800', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.011', 'weapon2': '0.020', 'AMMO4': '0.052', 'AMMO3': '0.074', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.440', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon5': '1.314', 'DAMAGECOUNT': '1.600', 'weapon3': '2.140'} +[2023-09-14 12:46:42,305][102039] DAMAGECOUNT value on done: 560.0 +[2023-09-14 12:46:42,305][102039] DAMAGECOUNT value on done: 405.0 +[2023-09-14 12:46:42,870][102039] DAMAGECOUNT value on done: 620.0 +[2023-09-14 12:46:42,870][102039] DAMAGECOUNT value on done: 1172.0 +[2023-09-14 12:46:42,871][102039] Sum rewards: 2.643, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.016', 'AMMO3': '0.047', 'AMMO4': '0.079', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.490', 'weapon5': '0.768', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.100', 'weapon2': '1.118', 'weapon3': '1.218'} +[2023-09-14 12:46:42,871][102039] Sum rewards: 4.264, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.009', 'AMMO4': '0.045', 'AMMO3': '0.054', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.390', 'WEAPON3': '0.400', 'weapon2': '0.436', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.010', 'weapon5': '1.610'} +[2023-09-14 12:46:43,351][102046] DAMAGECOUNT value on done: 775.0 +[2023-09-14 12:46:43,351][102046] Sum rewards: 8.051, reward structure: {'HEALTH': '-1.850', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.010', 'AMMO5': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.049', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.620', 'weapon3': '1.566', 'weapon5': '1.806', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.000'} +[2023-09-14 12:46:43,351][102046] DAMAGECOUNT value on done: 655.0 +[2023-09-14 12:46:43,352][102046] Sum rewards: 0.861, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.014', 'weapon5': '0.062', 'AMMO4': '0.068', 'AMMO3': '0.084', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon2': '0.336', 'WEAPON3': '0.600', 'weapon4': '0.892', 'FRAGCOUNT': '1.000', 'weapon3': '1.444', 'DAMAGECOUNT': '1.850'} +[2023-09-14 12:46:43,936][102046] DAMAGECOUNT value on done: 698.0 +[2023-09-14 12:46:43,936][102046] DAMAGECOUNT value on done: 820.0 +[2023-09-14 12:46:44,006][102039] DAMAGECOUNT value on done: 740.0 +[2023-09-14 12:46:44,006][102039] DAMAGECOUNT value on done: 389.0 +[2023-09-14 12:46:44,007][102039] Sum rewards: 4.437, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.009', 'AMMO5': '0.010', 'weapon4': '0.032', 'AMMO3': '0.044', 'AMMO4': '0.044', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.712', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '1.396', 'weapon5': '1.440'} +[2023-09-14 12:46:44,007][102039] Sum rewards: 3.014, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.025', 'AMMO3': '0.038', 'WEAPON5': '0.100', 'AMMO4': '0.122', 'weapon5': '0.188', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.562', 'weapon3': '0.632', 'weapon4': '0.704', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.140'} +[2023-09-14 12:46:44,144][102001] DAMAGECOUNT value on done: 435.0 +[2023-09-14 12:46:44,145][102001] Sum rewards: 3.817, reward structure: {'HEALTH': '-1.890', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.010', 'AMMO4': '0.022', 'AMMO3': '0.043', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.432', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.360', 'weapon3': '1.374', 'weapon5': '1.860'} +[2023-09-14 12:46:44,144][102001] DAMAGECOUNT value on done: 525.0 +[2023-09-14 12:46:44,145][102001] Sum rewards: 3.875, reward structure: {'HEALTH': '-1.310', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'weapon5': '0.008', 'AMMO2': '0.027', 'AMMO3': '0.049', 'WEAPON5': '0.100', 'AMMO4': '0.137', 'weapon2': '0.192', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon4': '1.022', 'weapon3': '1.104', 'DAMAGECOUNT': '1.940'} +[2023-09-14 12:46:44,258][102003] DAMAGECOUNT value on done: 535.0 +[2023-09-14 12:46:44,258][102003] DAMAGECOUNT value on done: 560.0 +[2023-09-14 12:46:44,259][102003] Sum rewards: 5.183, reward structure: {'HEALTH': '-2.750', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.014', 'AMMO5': '0.015', 'AMMO4': '0.070', 'AMMO3': '0.075', 'WEAPON4': '0.100', 'weapon4': '0.248', 'WEAPON5': '0.300', 'weapon2': '0.350', 'WEAPON3': '0.600', 'weapon5': '1.488', 'weapon3': '1.922', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.750'} +[2023-09-14 12:46:44,259][102003] Sum rewards: 5.506, reward structure: {'HEALTH': '-2.600', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.010', 'AMMO5': '0.015', 'AMMO4': '0.050', 'AMMO3': '0.072', 'WEAPON4': '0.200', 'weapon2': '0.236', 'WEAPON5': '0.300', 'weapon4': '0.368', 'WEAPON3': '0.600', 'weapon5': '1.182', 'FRAGCOUNT': '2.000', 'weapon3': '2.172', 'DAMAGECOUNT': '2.900'} +[2023-09-14 12:46:44,413][101965] Updated weights for policy 0, policy_version 1905 (0.0013) +[2023-09-14 12:46:44,577][109198] Fps is (10 sec: 14338.5, 60 sec: 14131.2, 300 sec: 13380.3). Total num frames: 12292096. Throughput: 0: 1858.9, 1: 1699.2. Samples: 548326. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:46:44,579][109198] Avg episode reward: [(0, '4.477'), (1, '3.376')] +[2023-09-14 12:46:44,582][101718] Saving new best policy, reward=4.477! +[2023-09-14 12:46:44,596][102039] DAMAGECOUNT value on done: 683.0 +[2023-09-14 12:46:44,596][102039] DAMAGECOUNT value on done: 743.0 +[2023-09-14 12:46:44,597][102039] Sum rewards: 6.027, reward structure: {'HEALTH': '-0.580', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'AMMO2': '0.025', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.125', 'WEAPON3': '0.200', 'weapon5': '0.214', 'weapon2': '0.246', 'weapon3': '0.762', 'weapon4': '0.812', 'DAMAGECOUNT': '2.000', 'FRAGCOUNT': '2.000'} +[2023-09-14 12:46:44,859][102003] DAMAGECOUNT value on done: 380.0 +[2023-09-14 12:46:44,859][102003] Sum rewards: 2.124, reward structure: {'HEALTH': '-1.400', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.015', 'AMMO3': '0.030', 'AMMO4': '0.074', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.300', 'weapon5': '0.444', 'DAMAGECOUNT': '0.600', 'weapon2': '0.664', 'weapon4': '0.690', 'weapon3': '1.298'} +[2023-09-14 12:46:44,859][102003] DAMAGECOUNT value on done: 240.0 +[2023-09-14 12:46:44,920][102001] DAMAGECOUNT value on done: 504.0 +[2023-09-14 12:46:44,920][102001] Sum rewards: 4.320, reward structure: {'HEALTH': '-0.150', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.019', 'AMMO2': '0.030', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.138', 'AMMO4': '0.149', 'WEAPON3': '0.200', 'weapon2': '0.224', 'weapon3': '0.622', 'weapon4': '0.792', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.090'} +[2023-09-14 12:46:44,921][102001] DAMAGECOUNT value on done: 400.0 +[2023-09-14 12:46:45,024][101964] Updated weights for policy 1, policy_version 1097 (0.0013) +[2023-09-14 12:46:45,038][102046] DAMAGECOUNT value on done: 295.0 +[2023-09-14 12:46:45,038][102046] DAMAGECOUNT value on done: 379.0 +[2023-09-14 12:46:45,039][102046] Sum rewards: 3.169, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.007', 'AMMO4': '0.025', 'AMMO3': '0.040', 'weapon2': '0.124', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.582', 'DAMAGECOUNT': '0.890', 'weapon5': '1.214', 'weapon3': '1.582'} +[2023-09-14 12:46:45,236][102003] DAMAGECOUNT value on done: 690.0 +[2023-09-14 12:46:45,237][102003] Sum rewards: 3.000, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO2': '0.030', 'AMMO3': '0.063', 'weapon2': '0.146', 'AMMO4': '0.151', 'WEAPON5': '0.300', 'WEAPON4': '0.400', 'WEAPON3': '0.500', 'weapon5': '0.792', 'weapon4': '1.122', 'weapon3': '1.432', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.050'} +[2023-09-14 12:46:45,237][102003] DAMAGECOUNT value on done: 758.0 +[2023-09-14 12:46:45,238][102003] Sum rewards: 4.941, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.047', 'AMMO2': '-0.009', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO3': '0.070', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon2': '0.716', 'weapon5': '1.302', 'weapon3': '1.944', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050'} +[2023-09-14 12:46:45,684][102046] DAMAGECOUNT value on done: 590.0 +[2023-09-14 12:46:45,685][102046] DAMAGECOUNT value on done: 810.0 +[2023-09-14 12:46:45,685][102046] Sum rewards: 3.767, reward structure: {'HEALTH': '-1.520', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.025', 'AMMO3': '0.044', 'AMMO4': '0.123', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.232', 'WEAPON3': '0.400', 'weapon4': '0.776', 'weapon5': '0.902', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon3': '1.378'} +[2023-09-14 12:46:45,890][102003] DAMAGECOUNT value on done: 698.0 +[2023-09-14 12:46:45,891][102003] DAMAGECOUNT value on done: 440.0 +[2023-09-14 12:46:45,891][102003] Sum rewards: 5.899, reward structure: {'HEALTH': '-0.400', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.426', 'weapon3': '0.830', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.000', 'weapon5': '2.748'} +[2023-09-14 12:46:46,556][102001] DAMAGECOUNT value on done: 730.0 +[2023-09-14 12:46:46,556][102001] DAMAGECOUNT value on done: 973.0 +[2023-09-14 12:46:46,557][102001] Sum rewards: 7.940, reward structure: {'DEATHCOUNT': '-4.000', 'HEALTH': '-4.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.025', 'AMMO4': '0.026', 'weapon5': '0.102', 'AMMO3': '0.129', 'weapon4': '0.154', 'WEAPON4': '0.200', 'WEAPON5': '0.500', 'weapon2': '0.732', 'WEAPON3': '1.000', 'weapon3': '2.916', 'FRAGCOUNT': '5.000', 'DAMAGECOUNT': '5.150'} +[2023-09-14 12:46:46,557][102001] Sum rewards: 4.155, reward structure: {'HEALTH': '-5.000', 'DEATHCOUNT': '-5.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.046', 'weapon2': '0.080', 'weapon5': '0.082', 'AMMO3': '0.131', 'AMMO4': '0.232', 'WEAPON5': '0.400', 'WEAPON4': '0.500', 'weapon4': '0.560', 'WEAPON3': '1.000', 'weapon3': '3.004', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.100'} +[2023-09-14 12:46:47,153][102001] DAMAGECOUNT value on done: 351.0 +[2023-09-14 12:46:47,153][102001] DAMAGECOUNT value on done: 485.0 +[2023-09-14 12:46:47,153][102001] Sum rewards: 5.034, reward structure: {'HEALTH': '-1.410', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.020', 'AMMO3': '0.039', 'weapon2': '0.070', 'AMMO4': '0.100', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.872', 'FRAGCOUNT': '0.999', 'weapon5': '1.198', 'weapon3': '1.536', 'DAMAGECOUNT': '1.800'} +[2023-09-14 12:46:49,577][109198] Fps is (10 sec: 13926.4, 60 sec: 14063.0, 300 sec: 13372.3). Total num frames: 12357632. Throughput: 0: 1852.6, 1: 1694.1. Samples: 558544. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:46:49,579][109198] Avg episode reward: [(0, '4.486'), (1, '3.350')] +[2023-09-14 12:46:49,586][101718] Saving new best policy, reward=4.486! +[2023-09-14 12:46:50,176][101965] Updated weights for policy 0, policy_version 1915 (0.0014) +[2023-09-14 12:46:51,306][101964] Updated weights for policy 1, policy_version 1107 (0.0012) +[2023-09-14 12:46:54,577][109198] Fps is (10 sec: 13516.8, 60 sec: 14131.2, 300 sec: 13388.1). Total num frames: 12427264. Throughput: 0: 1847.7, 1: 1690.1. Samples: 579719. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:46:54,579][109198] Avg episode reward: [(0, '4.486'), (1, '3.350')] +[2023-09-14 12:46:55,709][101965] Updated weights for policy 0, policy_version 1925 (0.0013) +[2023-09-14 12:46:57,220][101964] Updated weights for policy 1, policy_version 1117 (0.0013) +[2023-09-14 12:46:59,577][109198] Fps is (10 sec: 14335.9, 60 sec: 14199.5, 300 sec: 13425.8). Total num frames: 12500992. Throughput: 0: 1843.5, 1: 1691.2. Samples: 601229. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:46:59,579][109198] Avg episode reward: [(0, '4.486'), (1, '3.350')] +[2023-09-14 12:47:01,112][101965] Updated weights for policy 0, policy_version 1935 (0.0013) +[2023-09-14 12:47:03,180][101964] Updated weights for policy 1, policy_version 1127 (0.0013) +[2023-09-14 12:47:04,577][109198] Fps is (10 sec: 14745.5, 60 sec: 14199.5, 300 sec: 13461.5). Total num frames: 12574720. Throughput: 0: 1843.4, 1: 1693.2. Samples: 611763. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:47:04,579][109198] Avg episode reward: [(0, '4.486'), (1, '3.350')] +[2023-09-14 12:47:05,598][102004] DAMAGECOUNT value on done: 1286.0 +[2023-09-14 12:47:05,598][102004] DAMAGECOUNT value on done: 739.0 +[2023-09-14 12:47:05,599][102004] Sum rewards: 8.817, reward structure: {'HEALTH': '-2.800', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.015', 'AMMO2': '-0.003', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'weapon4': '0.036', 'AMMO3': '0.059', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon5': '0.608', 'weapon2': '0.848', 'weapon3': '2.420', 'FRAGCOUNT': '3.999', 'DAMAGECOUNT': '4.650'} +[2023-09-14 12:47:05,599][102004] Sum rewards: 0.665, reward structure: {'HEALTH': '-4.500', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.035', 'weapon5': '0.098', 'AMMO3': '0.129', 'weapon4': '0.154', 'AMMO4': '0.175', 'WEAPON4': '0.300', 'WEAPON5': '0.400', 'weapon2': '0.726', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '2.450', 'weapon3': '2.678'} +[2023-09-14 12:47:06,105][102004] DAMAGECOUNT value on done: 880.0 +[2023-09-14 12:47:06,105][102004] DAMAGECOUNT value on done: 1000.0 +[2023-09-14 12:47:06,106][102004] Sum rewards: 7.617, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.012', 'AMMO5': '0.015', 'AMMO4': '0.058', 'AMMO3': '0.060', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon2': '0.378', 'weapon5': '0.460', 'weapon4': '0.548', 'WEAPON3': '0.600', 'weapon3': '2.436', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.450'} +[2023-09-14 12:47:06,106][102004] Sum rewards: 3.607, reward structure: {'HEALTH': '-4.400', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.025', 'AMMO2': '0.040', 'weapon5': '0.044', 'AMMO3': '0.122', 'weapon4': '0.130', 'AMMO4': '0.199', 'WEAPON4': '0.300', 'weapon2': '0.486', 'WEAPON5': '0.500', 'WEAPON3': '1.000', 'FRAGCOUNT': '3.000', 'weapon3': '3.060', 'DAMAGECOUNT': '3.100'} +[2023-09-14 12:47:06,610][101965] Updated weights for policy 0, policy_version 1945 (0.0012) +[2023-09-14 12:47:08,453][102037] DAMAGECOUNT value on done: 730.0 +[2023-09-14 12:47:08,453][102037] DAMAGECOUNT value on done: 1061.0 +[2023-09-14 12:47:08,454][102037] Sum rewards: 3.590, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.031', 'AMMO3': '0.085', 'AMMO4': '0.156', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon2': '0.394', 'weapon4': '0.514', 'WEAPON3': '0.700', 'weapon5': '0.722', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.150', 'weapon3': '2.222'} +[2023-09-14 12:47:08,454][102037] Sum rewards: 7.428, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.025', 'AMMO3': '0.060', 'AMMO4': '0.122', 'WEAPON4': '0.200', 'weapon2': '0.276', 'WEAPON5': '0.300', 'weapon4': '0.460', 'WEAPON3': '0.600', 'weapon5': '0.902', 'weapon3': '2.318', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.150'} +[2023-09-14 12:47:08,898][101964] Updated weights for policy 1, policy_version 1137 (0.0012) +[2023-09-14 12:47:09,011][102037] DAMAGECOUNT value on done: 746.0 +[2023-09-14 12:47:09,012][102037] DAMAGECOUNT value on done: 570.0 +[2023-09-14 12:47:09,327][102037] DAMAGECOUNT value on done: 1210.0 +[2023-09-14 12:47:09,327][102037] DAMAGECOUNT value on done: 1125.0 +[2023-09-14 12:47:09,328][102037] Sum rewards: 9.155, reward structure: {'HEALTH': '-2.100', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.020', 'AMMO3': '0.059', 'AMMO4': '0.098', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.314', 'weapon2': '0.484', 'WEAPON3': '0.600', 'weapon5': '0.894', 'weapon3': '2.170', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.100'} +[2023-09-14 12:47:09,328][102037] Sum rewards: 1.724, reward structure: {'DEATHCOUNT': '-4.000', 'HEALTH': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.017', 'AMMO4': '0.086', 'AMMO3': '0.125', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon5': '0.312', 'weapon2': '0.506', 'weapon4': '0.586', 'WEAPON3': '0.900', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.250', 'weapon3': '2.326'} +[2023-09-14 12:47:09,577][109198] Fps is (10 sec: 14745.7, 60 sec: 14267.7, 300 sec: 13495.3). Total num frames: 12648448. Throughput: 0: 1858.3, 1: 1710.1. Samples: 633919. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:47:09,579][109198] Avg episode reward: [(0, '4.590'), (1, '3.367')] +[2023-09-14 12:47:09,585][101718] Saving new best policy, reward=4.590! +[2023-09-14 12:47:09,902][102037] DAMAGECOUNT value on done: 735.0 +[2023-09-14 12:47:09,902][102037] DAMAGECOUNT value on done: 684.0 +[2023-09-14 12:47:09,903][102037] Sum rewards: 5.445, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.010', 'AMMO4': '0.025', 'AMMO3': '0.043', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.306', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon3': '1.466', 'DAMAGECOUNT': '1.600', 'weapon5': '2.290'} +[2023-09-14 12:47:09,903][102037] Sum rewards: 3.219, reward structure: {'HEALTH': '-1.600', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.010', 'AMMO3': '0.035', 'AMMO4': '0.047', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon2': '0.134', 'WEAPON3': '0.300', 'weapon4': '0.436', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.058', 'weapon5': '1.596'} +[2023-09-14 12:47:10,483][102005] DAMAGECOUNT value on done: 490.0 +[2023-09-14 12:47:10,483][102005] DAMAGECOUNT value on done: 376.0 +[2023-09-14 12:47:11,057][102005] DAMAGECOUNT value on done: 770.0 +[2023-09-14 12:47:11,057][102005] DAMAGECOUNT value on done: 1123.0 +[2023-09-14 12:47:11,058][102005] Sum rewards: 3.041, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.007', 'AMMO5': '0.010', 'AMMO4': '0.033', 'AMMO3': '0.052', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.394', 'WEAPON3': '0.400', 'weapon2': '0.416', 'DAMAGECOUNT': '0.600', 'weapon3': '0.920', 'weapon5': '1.810'} +[2023-09-14 12:47:11,058][102005] Sum rewards: 2.824, reward structure: {'HEALTH': '-1.350', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.022', 'AMMO3': '0.031', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO4': '0.111', 'WEAPON3': '0.300', 'weapon4': '0.676', 'weapon2': '0.772', 'DAMAGECOUNT': '0.900', 'weapon5': '1.046', 'weapon3': '1.112'} +[2023-09-14 12:47:12,018][101965] Updated weights for policy 0, policy_version 1955 (0.0014) +[2023-09-14 12:47:12,395][102040] DAMAGECOUNT value on done: 905.0 +[2023-09-14 12:47:12,396][102040] DAMAGECOUNT value on done: 730.0 +[2023-09-14 12:47:12,396][102040] Sum rewards: 6.060, reward structure: {'HEALTH': '-1.250', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.050', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.326', 'WEAPON3': '0.400', 'weapon4': '0.566', 'weapon5': '0.830', 'weapon3': '1.580', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.100'} +[2023-09-14 12:47:12,896][102040] DAMAGECOUNT value on done: 342.0 +[2023-09-14 12:47:12,896][102040] DAMAGECOUNT value on done: 542.0 +[2023-09-14 12:47:12,897][102040] Sum rewards: 5.455, reward structure: {'HEALTH': '-0.700', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.344', 'weapon3': '0.674', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.290', 'weapon5': '2.552'} +[2023-09-14 12:47:14,577][109198] Fps is (10 sec: 14336.1, 60 sec: 14199.5, 300 sec: 13506.3). Total num frames: 12718080. Throughput: 0: 1869.4, 1: 1722.1. Samples: 655810. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:47:14,578][109198] Avg episode reward: [(0, '4.593'), (1, '3.349')] +[2023-09-14 12:47:14,580][101718] Saving new best policy, reward=4.593! +[2023-09-14 12:47:14,791][101964] Updated weights for policy 1, policy_version 1147 (0.0011) +[2023-09-14 12:47:14,824][102005] DAMAGECOUNT value on done: 662.0 +[2023-09-14 12:47:14,824][102005] DAMAGECOUNT value on done: 567.0 +[2023-09-14 12:47:15,289][102004] DAMAGECOUNT value on done: 1356.0 +[2023-09-14 12:47:15,289][102004] DAMAGECOUNT value on done: 886.0 +[2023-09-14 12:47:15,290][102004] Sum rewards: 6.789, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.012', 'AMMO3': '0.077', 'WEAPON4': '0.100', 'weapon5': '0.230', 'WEAPON5': '0.300', 'weapon4': '0.322', 'weapon2': '0.462', 'WEAPON3': '0.700', 'weapon3': '2.496', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.090'} +[2023-09-14 12:47:15,290][102004] Sum rewards: 4.107, reward structure: {'HEALTH': '-4.040', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.025', 'AMMO2': '0.030', 'AMMO3': '0.126', 'weapon2': '0.132', 'AMMO4': '0.150', 'weapon5': '0.372', 'WEAPON4': '0.400', 'weapon4': '0.412', 'WEAPON5': '0.500', 'WEAPON3': '1.000', 'weapon3': '3.000', 'DAMAGECOUNT': '3.000', 'FRAGCOUNT': '3.000'} +[2023-09-14 12:47:15,339][102005] DAMAGECOUNT value on done: 1200.0 +[2023-09-14 12:47:15,340][102005] DAMAGECOUNT value on done: 1295.0 +[2023-09-14 12:47:15,340][102005] Sum rewards: 6.857, reward structure: {'DEATHCOUNT': '-4.000', 'HEALTH': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.025', 'AMMO2': '0.036', 'AMMO3': '0.135', 'AMMO4': '0.181', 'weapon2': '0.202', 'WEAPON4': '0.400', 'weapon5': '0.414', 'weapon4': '0.486', 'WEAPON5': '0.500', 'WEAPON3': '1.000', 'weapon3': '2.728', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.750'} +[2023-09-14 12:47:15,341][102005] Sum rewards: 5.865, reward structure: {'HEALTH': '-4.500', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.025', 'AMMO2': '0.029', 'AMMO3': '0.136', 'AMMO4': '0.143', 'weapon2': '0.144', 'WEAPON4': '0.400', 'weapon4': '0.456', 'WEAPON5': '0.500', 'weapon5': '0.574', 'WEAPON3': '1.000', 'weapon3': '2.658', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.300'} +[2023-09-14 12:47:15,879][102004] DAMAGECOUNT value on done: 779.0 +[2023-09-14 12:47:15,879][102004] DAMAGECOUNT value on done: 845.0 +[2023-09-14 12:47:15,880][102004] Sum rewards: 6.730, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.692', 'weapon3': '1.442', 'weapon5': '1.906', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.100'} +[2023-09-14 12:47:15,880][102004] Sum rewards: 2.850, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.012', 'AMMO4': '0.057', 'AMMO3': '0.072', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.334', 'WEAPON3': '0.600', 'weapon4': '0.632', 'weapon2': '0.836', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.896'} +[2023-09-14 12:47:16,657][102040] DAMAGECOUNT value on done: 940.0 +[2023-09-14 12:47:16,657][102040] DAMAGECOUNT value on done: 645.0 +[2023-09-14 12:47:16,657][102040] Sum rewards: 1.717, reward structure: {'HEALTH': '-2.750', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.022', 'AMMO3': '0.071', 'WEAPON5': '0.100', 'AMMO4': '0.108', 'WEAPON4': '0.200', 'WEAPON3': '0.500', 'weapon4': '0.512', 'weapon2': '0.736', 'weapon5': '0.876', 'FRAGCOUNT': '1.000', 'weapon3': '1.086', 'DAMAGECOUNT': '1.250'} +[2023-09-14 12:47:16,658][102040] Sum rewards: 5.598, reward structure: {'HEALTH': '-2.150', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.020', 'AMMO3': '0.066', 'AMMO4': '0.099', 'WEAPON5': '0.200', 'weapon2': '0.264', 'weapon5': '0.284', 'WEAPON4': '0.300', 'WEAPON3': '0.600', 'weapon4': '1.002', 'FRAGCOUNT': '1.999', 'weapon3': '2.106', 'DAMAGECOUNT': '2.800'} +[2023-09-14 12:47:17,305][102040] DAMAGECOUNT value on done: 905.0 +[2023-09-14 12:47:17,306][102040] Sum rewards: 4.357, reward structure: {'HEALTH': '-3.900', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.015', 'AMMO4': '0.022', 'AMMO3': '0.081', 'WEAPON4': '0.100', 'weapon4': '0.210', 'WEAPON5': '0.300', 'weapon2': '0.420', 'WEAPON3': '0.700', 'weapon5': '1.000', 'weapon3': '2.304', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.100'} +[2023-09-14 12:47:17,305][102040] DAMAGECOUNT value on done: 945.0 +[2023-09-14 12:47:17,306][102040] Sum rewards: 6.396, reward structure: {'HEALTH': '-3.100', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.016', 'AMMO5': '0.020', 'weapon2': '0.050', 'AMMO4': '0.079', 'AMMO3': '0.097', 'WEAPON4': '0.300', 'WEAPON5': '0.400', 'weapon5': '0.450', 'weapon4': '0.742', 'WEAPON3': '0.800', 'weapon3': '2.542', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '4.000'} +[2023-09-14 12:47:17,583][101965] Updated weights for policy 0, policy_version 1965 (0.0013) +[2023-09-14 12:47:19,577][109198] Fps is (10 sec: 13926.3, 60 sec: 14199.5, 300 sec: 13516.8). Total num frames: 12787712. Throughput: 0: 1861.9, 1: 1717.3. Samples: 666326. Policy #0 lag: (min: 0.0, avg: 0.8, max: 3.0) +[2023-09-14 12:47:19,579][109198] Avg episode reward: [(0, '4.559'), (1, '3.316')] +[2023-09-14 12:47:20,693][102039] DAMAGECOUNT value on done: 670.0 +[2023-09-14 12:47:20,693][102039] DAMAGECOUNT value on done: 510.0 +[2023-09-14 12:47:20,694][102039] Sum rewards: 4.843, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.014', 'AMMO3': '0.045', 'AMMO4': '0.068', 'WEAPON4': '0.100', 'weapon4': '0.136', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.778', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon3': '1.428', 'weapon5': '1.564'} +[2023-09-14 12:47:20,694][102039] Sum rewards: 4.533, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.027', 'AMMO3': '0.048', 'WEAPON5': '0.100', 'AMMO4': '0.136', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.602', 'weapon2': '0.604', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '1.112', 'weapon5': '1.298'} +[2023-09-14 12:47:20,789][101964] Updated weights for policy 1, policy_version 1157 (0.0012) +[2023-09-14 12:47:21,283][102039] DAMAGECOUNT value on done: 834.0 +[2023-09-14 12:47:21,283][102039] DAMAGECOUNT value on done: 1472.0 +[2023-09-14 12:47:21,284][102039] Sum rewards: 2.689, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.022', 'AMMO3': '0.068', 'WEAPON5': '0.100', 'AMMO4': '0.112', 'WEAPON4': '0.200', 'WEAPON3': '0.500', 'weapon2': '0.626', 'weapon4': '0.666', 'weapon5': '0.930', 'weapon3': '1.320', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.140'} +[2023-09-14 12:47:21,284][102039] Sum rewards: 6.659, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.013', 'AMMO4': '0.065', 'AMMO3': '0.071', 'WEAPON5': '0.200', 'weapon5': '0.234', 'WEAPON4': '0.300', 'WEAPON3': '0.600', 'weapon4': '0.636', 'weapon2': '0.694', 'weapon3': '1.836', 'DAMAGECOUNT': '3.000', 'FRAGCOUNT': '3.000'} +[2023-09-14 12:47:21,612][102046] DAMAGECOUNT value on done: 695.0 +[2023-09-14 12:47:21,613][102046] DAMAGECOUNT value on done: 775.0 +[2023-09-14 12:47:22,295][102046] DAMAGECOUNT value on done: 773.0 +[2023-09-14 12:47:22,296][102046] DAMAGECOUNT value on done: 1195.0 +[2023-09-14 12:47:22,296][102046] Sum rewards: 7.775, reward structure: {'HEALTH': '-1.450', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO3': '0.030', 'AMMO2': '0.040', 'AMMO4': '0.200', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.360', 'weapon5': '0.818', 'weapon4': '0.986', 'weapon3': '1.334', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '3.750'} +[2023-09-14 12:47:22,477][102039] DAMAGECOUNT value on done: 885.0 +[2023-09-14 12:47:22,477][102039] DAMAGECOUNT value on done: 459.0 +[2023-09-14 12:47:22,478][102039] Sum rewards: 6.141, reward structure: {'HEALTH': '-0.700', 'AMMO4': '-0.000', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.126', 'WEAPON3': '0.200', 'weapon2': '0.296', 'weapon3': '0.784', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.450', 'weapon5': '2.760'} +[2023-09-14 12:47:22,817][102001] DAMAGECOUNT value on done: 435.0 +[2023-09-14 12:47:22,818][102001] DAMAGECOUNT value on done: 535.0 +[2023-09-14 12:47:22,985][101965] Updated weights for policy 0, policy_version 1975 (0.0012) +[2023-09-14 12:47:23,037][102039] DAMAGECOUNT value on done: 753.0 +[2023-09-14 12:47:23,037][102039] DAMAGECOUNT value on done: 892.0 +[2023-09-14 12:47:23,038][102039] Sum rewards: 6.060, reward structure: {'HEALTH': '-0.700', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO3': '0.020', 'AMMO2': '0.020', 'AMMO4': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.346', 'weapon4': '0.566', 'weapon3': '0.782', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.490', 'weapon5': '2.032'} +[2023-09-14 12:47:23,365][102001] DAMAGECOUNT value on done: 400.0 +[2023-09-14 12:47:23,365][102001] DAMAGECOUNT value on done: 631.0 +[2023-09-14 12:47:23,366][102001] Sum rewards: 5.881, reward structure: {'HEALTH': '-0.320', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.015', 'AMMO3': '0.020', 'AMMO4': '0.075', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.352', 'weapon2': '0.684', 'weapon3': '0.746', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.270', 'weapon5': '1.636'} +[2023-09-14 12:47:23,407][102046] DAMAGECOUNT value on done: 425.0 +[2023-09-14 12:47:23,408][102046] DAMAGECOUNT value on done: 484.0 +[2023-09-14 12:47:23,408][102046] Sum rewards: 4.474, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.018', 'AMMO3': '0.042', 'AMMO4': '0.090', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.510', 'weapon5': '0.522', 'weapon2': '0.836', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.300', 'weapon3': '1.346'} +[2023-09-14 12:47:23,408][102046] Sum rewards: 2.944, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.025', 'AMMO3': '0.030', 'weapon5': '0.080', 'WEAPON5': '0.100', 'AMMO4': '0.122', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon4': '0.422', 'weapon2': '0.684', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '1.126'} +[2023-09-14 12:47:23,729][102003] DAMAGECOUNT value on done: 810.0 +[2023-09-14 12:47:23,729][102003] DAMAGECOUNT value on done: 1070.0 +[2023-09-14 12:47:23,730][102003] Sum rewards: 10.397, reward structure: {'HEALTH': '-2.700', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.015', 'AMMO3': '0.060', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon2': '0.362', 'weapon4': '0.552', 'WEAPON3': '0.600', 'weapon5': '0.658', 'weapon3': '2.250', 'FRAGCOUNT': '5.000', 'DAMAGECOUNT': '5.100'} +[2023-09-14 12:47:23,729][102003] Sum rewards: 0.844, reward structure: {'DEATHCOUNT': '-5.000', 'HEALTH': '-5.000', 'HITCOUNT': '0.000', 'AMMO2': '0.023', 'AMMO5': '0.025', 'AMMO4': '0.117', 'AMMO3': '0.166', 'weapon2': '0.384', 'WEAPON4': '0.400', 'WEAPON5': '0.500', 'weapon4': '0.508', 'weapon5': '0.860', 'WEAPON3': '1.100', 'FRAGCOUNT': '2.000', 'weapon3': '2.010', 'DAMAGECOUNT': '2.750'} +[2023-09-14 12:47:23,987][102046] DAMAGECOUNT value on done: 615.0 +[2023-09-14 12:47:23,987][102046] DAMAGECOUNT value on done: 926.0 +[2023-09-14 12:47:23,988][102046] Sum rewards: 3.980, reward structure: {'HEALTH': '-0.250', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'AMMO2': '0.023', 'weapon5': '0.062', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.116', 'WEAPON3': '0.200', 'weapon2': '0.220', 'weapon4': '0.568', 'weapon3': '0.658', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.160'} +[2023-09-14 12:47:24,276][102003] DAMAGECOUNT value on done: 365.0 +[2023-09-14 12:47:24,277][102003] DAMAGECOUNT value on done: 490.0 +[2023-09-14 12:47:24,278][102003] Sum rewards: 4.241, reward structure: {'HEALTH': '-1.250', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.025', 'AMMO3': '0.056', 'WEAPON5': '0.100', 'AMMO4': '0.122', 'WEAPON4': '0.200', 'weapon2': '0.214', 'WEAPON3': '0.400', 'weapon4': '0.776', 'weapon3': '0.906', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon5': '1.586'} +[2023-09-14 12:47:24,277][102003] Sum rewards: 5.021, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.314', 'weapon2': '0.344', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.250', 'weapon3': '1.510', 'weapon5': '1.854'} +[2023-09-14 12:47:24,577][109198] Fps is (10 sec: 14335.9, 60 sec: 14336.0, 300 sec: 13546.8). Total num frames: 12861440. Throughput: 0: 1861.9, 1: 1717.9. Samples: 687752. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:47:24,579][109198] Avg episode reward: [(0, '4.599'), (1, '3.420')] +[2023-09-14 12:47:24,580][101718] Saving new best policy, reward=4.599! +[2023-09-14 12:47:24,808][102001] DAMAGECOUNT value on done: 1340.0 +[2023-09-14 12:47:24,808][102001] DAMAGECOUNT value on done: 1418.0 +[2023-09-14 12:47:24,809][102001] Sum rewards: 9.775, reward structure: {'HEALTH': '-4.200', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.043', 'weapon5': '0.092', 'AMMO3': '0.127', 'weapon2': '0.190', 'AMMO4': '0.215', 'WEAPON4': '0.300', 'weapon4': '0.394', 'WEAPON5': '0.400', 'WEAPON3': '1.000', 'weapon3': '3.094', 'FRAGCOUNT': '6.000', 'DAMAGECOUNT': '6.100'} +[2023-09-14 12:47:24,809][102001] Sum rewards: 3.013, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-6.000', 'HITCOUNT': '0.000', 'AMMO5': '0.030', 'AMMO2': '0.043', 'weapon2': '0.044', 'AMMO3': '0.167', 'AMMO4': '0.213', 'weapon5': '0.244', 'WEAPON4': '0.500', 'weapon4': '0.598', 'WEAPON5': '0.600', 'WEAPON3': '1.200', 'weapon3': '2.924', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.450'} +[2023-09-14 12:47:24,822][102003] DAMAGECOUNT value on done: 963.0 +[2023-09-14 12:47:24,823][102003] Sum rewards: 8.506, reward structure: {'HEALTH': '-0.100', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.024', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.314', 'weapon3': '0.694', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050', 'weapon5': '3.094'} +[2023-09-14 12:47:24,822][102003] DAMAGECOUNT value on done: 700.0 +[2023-09-14 12:47:25,413][102003] DAMAGECOUNT value on done: 815.0 +[2023-09-14 12:47:25,413][102003] DAMAGECOUNT value on done: 530.0 +[2023-09-14 12:47:25,413][102003] Sum rewards: 4.020, reward structure: {'HEALTH': '-1.400', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.732', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.170', 'weapon5': '1.262', 'weapon3': '1.668'} +[2023-09-14 12:47:25,414][102003] Sum rewards: 4.264, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.022', 'AMMO3': '0.040', 'AMMO4': '0.112', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.332', 'WEAPON3': '0.400', 'weapon5': '0.604', 'weapon4': '0.798', 'DAMAGECOUNT': '0.900', 'FRAGCOUNT': '1.000', 'weapon3': '1.746'} +[2023-09-14 12:47:25,551][102001] DAMAGECOUNT value on done: 516.0 +[2023-09-14 12:47:25,551][102001] DAMAGECOUNT value on done: 635.0 +[2023-09-14 12:47:25,552][102001] Sum rewards: 4.686, reward structure: {'HEALTH': '-1.500', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.034', 'AMMO3': '0.040', 'AMMO4': '0.172', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.320', 'WEAPON3': '0.400', 'weapon4': '0.776', 'weapon2': '0.976', 'FRAGCOUNT': '1.000', 'weapon3': '1.408', 'DAMAGECOUNT': '1.650'} +[2023-09-14 12:47:25,552][102001] Sum rewards: 3.908, reward structure: {'HEALTH': '-1.600', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.049', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.278', 'WEAPON3': '0.400', 'weapon2': '0.692', 'FRAGCOUNT': '1.000', 'weapon5': '1.104', 'weapon3': '1.280', 'DAMAGECOUNT': '1.500'} +[2023-09-14 12:47:26,825][101964] Updated weights for policy 1, policy_version 1167 (0.0014) +[2023-09-14 12:47:28,610][101965] Updated weights for policy 0, policy_version 1985 (0.0014) +[2023-09-14 12:47:29,577][109198] Fps is (10 sec: 14336.1, 60 sec: 14336.0, 300 sec: 13555.8). Total num frames: 12931072. Throughput: 0: 1855.2, 1: 1711.9. Samples: 708846. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:47:29,579][109198] Avg episode reward: [(0, '4.719'), (1, '3.386')] +[2023-09-14 12:47:29,585][101718] Saving new best policy, reward=4.719! +[2023-09-14 12:47:33,116][101964] Updated weights for policy 1, policy_version 1177 (0.0013) +[2023-09-14 12:47:34,112][101965] Updated weights for policy 0, policy_version 1995 (0.0013) +[2023-09-14 12:47:34,577][109198] Fps is (10 sec: 13926.4, 60 sec: 14199.9, 300 sec: 13564.4). Total num frames: 13000704. Throughput: 0: 1857.0, 1: 1710.3. Samples: 719072. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:47:34,579][109198] Avg episode reward: [(0, '4.719'), (1, '3.386')] +[2023-09-14 12:47:39,091][101964] Updated weights for policy 1, policy_version 1187 (0.0014) +[2023-09-14 12:47:39,338][102004] DAMAGECOUNT value on done: 1606.0 +[2023-09-14 12:47:39,338][102004] DAMAGECOUNT value on done: 1094.0 +[2023-09-14 12:47:39,339][102004] Sum rewards: 5.369, reward structure: {'HEALTH': '-3.400', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.013', 'AMMO5': '0.020', 'weapon2': '0.042', 'AMMO4': '0.066', 'AMMO3': '0.097', 'WEAPON4': '0.300', 'WEAPON5': '0.400', 'weapon4': '0.582', 'WEAPON3': '0.800', 'weapon5': '0.820', 'weapon3': '2.428', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.200'} +[2023-09-14 12:47:39,339][102004] Sum rewards: 5.956, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.017', 'weapon2': '0.032', 'AMMO4': '0.083', 'AMMO3': '0.085', 'weapon4': '0.286', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'WEAPON3': '0.700', 'weapon5': '1.406', 'weapon3': '2.182', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.550'} +[2023-09-14 12:47:39,577][109198] Fps is (10 sec: 13926.4, 60 sec: 14199.5, 300 sec: 13572.7). Total num frames: 13070336. Throughput: 0: 1859.9, 1: 1715.9. Samples: 740628. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:47:39,579][109198] Avg episode reward: [(0, '4.761'), (1, '3.386')] +[2023-09-14 12:47:39,586][101718] Saving new best policy, reward=4.761! +[2023-09-14 12:47:39,751][101965] Updated weights for policy 0, policy_version 2005 (0.0013) +[2023-09-14 12:47:39,914][102004] DAMAGECOUNT value on done: 1030.0 +[2023-09-14 12:47:39,914][102004] DAMAGECOUNT value on done: 1040.0 +[2023-09-14 12:47:39,914][102004] Sum rewards: 6.479, reward structure: {'HEALTH': '-0.400', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.354', 'weapon3': '0.802', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.500', 'weapon5': '2.928'} +[2023-09-14 12:47:44,577][109198] Fps is (10 sec: 14335.9, 60 sec: 14199.5, 300 sec: 13598.7). Total num frames: 13144064. Throughput: 0: 1860.3, 1: 1713.0. Samples: 762030. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:47:44,579][109198] Avg episode reward: [(0, '4.797'), (1, '3.386')] +[2023-09-14 12:47:44,605][101718] Saving new best policy, reward=4.797! +[2023-09-14 12:47:45,127][101964] Updated weights for policy 1, policy_version 1197 (0.0013) +[2023-09-14 12:47:45,194][101965] Updated weights for policy 0, policy_version 2015 (0.0013) +[2023-09-14 12:47:46,014][102037] DAMAGECOUNT value on done: 1461.0 +[2023-09-14 12:47:46,014][102037] DAMAGECOUNT value on done: 1245.0 +[2023-09-14 12:47:46,015][102037] Sum rewards: 4.050, reward structure: {'HEALTH': '-5.150', 'DEATHCOUNT': '-5.000', 'HITCOUNT': '0.000', 'AMMO2': '0.016', 'AMMO5': '0.025', 'AMMO4': '0.082', 'AMMO3': '0.170', 'weapon2': '0.224', 'WEAPON4': '0.300', 'weapon4': '0.454', 'WEAPON5': '0.500', 'weapon5': '0.572', 'WEAPON3': '1.200', 'weapon3': '2.656', 'DAMAGECOUNT': '4.000', 'FRAGCOUNT': '4.000'} +[2023-09-14 12:47:46,015][102037] Sum rewards: 7.626, reward structure: {'HEALTH': '-4.000', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.039', 'weapon2': '0.058', 'AMMO3': '0.082', 'AMMO4': '0.195', 'WEAPON5': '0.300', 'WEAPON4': '0.400', 'weapon5': '0.528', 'WEAPON3': '0.700', 'weapon4': '0.876', 'weapon3': '2.282', 'FRAGCOUNT': '5.000', 'DAMAGECOUNT': '5.150'} +[2023-09-14 12:47:46,585][102037] DAMAGECOUNT value on done: 821.0 +[2023-09-14 12:47:46,585][102037] DAMAGECOUNT value on done: 865.0 +[2023-09-14 12:47:46,586][102037] Sum rewards: 8.577, reward structure: {'HEALTH': '-0.750', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.348', 'weapon3': '0.868', 'FRAGCOUNT': '2.000', 'weapon5': '2.866', 'DAMAGECOUNT': '2.950'} +[2023-09-14 12:47:46,928][102037] DAMAGECOUNT value on done: 1540.0 +[2023-09-14 12:47:46,929][102037] DAMAGECOUNT value on done: 1635.0 +[2023-09-14 12:47:46,929][102037] Sum rewards: 2.485, reward structure: {'HEALTH': '-5.000', 'DEATHCOUNT': '-5.000', 'HITCOUNT': '0.000', 'AMMO5': '0.025', 'AMMO2': '0.054', 'AMMO3': '0.152', 'weapon4': '0.240', 'AMMO4': '0.271', 'weapon5': '0.306', 'WEAPON4': '0.400', 'weapon2': '0.494', 'WEAPON5': '0.500', 'WEAPON3': '1.100', 'weapon3': '2.642', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.300'} +[2023-09-14 12:47:46,930][102037] Sum rewards: 9.630, reward structure: {'HEALTH': '-3.200', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.035', 'AMMO3': '0.090', 'AMMO4': '0.173', 'weapon4': '0.292', 'WEAPON4': '0.300', 'weapon2': '0.338', 'WEAPON5': '0.400', 'weapon5': '0.458', 'WEAPON3': '0.800', 'weapon3': '2.824', 'FRAGCOUNT': '5.000', 'DAMAGECOUNT': '5.100'} +[2023-09-14 12:47:47,639][102037] DAMAGECOUNT value on done: 835.0 +[2023-09-14 12:47:47,639][102037] DAMAGECOUNT value on done: 804.0 +[2023-09-14 12:47:47,640][102037] Sum rewards: 2.896, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.010', 'weapon2': '0.038', 'AMMO3': '0.051', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.218', 'WEAPON3': '0.400', 'weapon5': '0.822', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.256'} +[2023-09-14 12:47:47,640][102037] Sum rewards: 4.353, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.026', 'AMMO3': '0.040', 'AMMO4': '0.129', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.352', 'WEAPON3': '0.400', 'weapon5': '0.682', 'weapon4': '0.814', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.200', 'weapon3': '1.300'} +[2023-09-14 12:47:48,019][102005] DAMAGECOUNT value on done: 515.0 +[2023-09-14 12:47:48,019][102005] DAMAGECOUNT value on done: 476.0 +[2023-09-14 12:47:48,020][102005] Sum rewards: 6.069, reward structure: {'HEALTH': '-0.250', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.025', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.125', 'WEAPON3': '0.200', 'weapon2': '0.422', 'weapon4': '0.606', 'weapon3': '0.768', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon5': '1.948'} +[2023-09-14 12:47:48,669][102005] DAMAGECOUNT value on done: 854.0 +[2023-09-14 12:47:48,670][102005] DAMAGECOUNT value on done: 1208.0 +[2023-09-14 12:47:48,670][102005] Sum rewards: 3.649, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.025', 'AMMO3': '0.040', 'AMMO4': '0.125', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.290', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.840', 'weapon4': '0.850', 'weapon3': '1.204', 'weapon5': '1.468'} +[2023-09-14 12:47:49,558][102040] DAMAGECOUNT value on done: 1060.0 +[2023-09-14 12:47:49,558][102040] DAMAGECOUNT value on done: 845.0 +[2023-09-14 12:47:49,559][102040] Sum rewards: 5.192, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.020', 'AMMO3': '0.052', 'AMMO4': '0.099', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.532', 'weapon2': '0.946', 'FRAGCOUNT': '1.000', 'weapon3': '1.018', 'weapon5': '1.414', 'DAMAGECOUNT': '1.550'} +[2023-09-14 12:47:49,559][102040] Sum rewards: 4.252, reward structure: {'HEALTH': '-1.500', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.704', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150', 'weapon3': '1.438', 'weapon5': '1.870'} +[2023-09-14 12:47:49,577][109198] Fps is (10 sec: 14336.1, 60 sec: 14267.7, 300 sec: 13605.9). Total num frames: 13213696. Throughput: 0: 1862.4, 1: 1714.2. Samples: 772709. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:47:49,578][109198] Avg episode reward: [(0, '4.853'), (1, '3.430')] +[2023-09-14 12:47:49,586][101802] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001204_4931584.pth... +[2023-09-14 12:47:49,586][101718] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002022_8282112.pth... +[2023-09-14 12:47:49,646][101802] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000837_3428352.pth +[2023-09-14 12:47:49,648][101718] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001625_6656000.pth +[2023-09-14 12:47:49,656][101718] Saving new best policy, reward=4.853! +[2023-09-14 12:47:50,208][102040] DAMAGECOUNT value on done: 342.0 +[2023-09-14 12:47:50,208][102040] DAMAGECOUNT value on done: 617.0 +[2023-09-14 12:47:50,751][101965] Updated weights for policy 0, policy_version 2025 (0.0014) +[2023-09-14 12:47:51,119][101964] Updated weights for policy 1, policy_version 1207 (0.0011) +[2023-09-14 12:47:52,144][102004] DAMAGECOUNT value on done: 1561.0 +[2023-09-14 12:47:52,145][102004] DAMAGECOUNT value on done: 1296.0 +[2023-09-14 12:47:52,145][102004] Sum rewards: 0.112, reward structure: {'HEALTH': '-5.000', 'DEATHCOUNT': '-5.000', 'HITCOUNT': '0.000', 'AMMO5': '0.025', 'weapon2': '0.030', 'AMMO2': '0.033', 'AMMO3': '0.152', 'AMMO4': '0.163', 'WEAPON4': '0.400', 'WEAPON5': '0.500', 'weapon4': '0.602', 'WEAPON3': '1.000', 'weapon5': '1.072', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.050', 'weapon3': '2.086'} +[2023-09-14 12:47:52,145][102004] Sum rewards: 9.116, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.008', 'AMMO5': '0.015', 'weapon4': '0.040', 'AMMO4': '0.042', 'AMMO3': '0.062', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon2': '0.696', 'weapon5': '0.936', 'weapon3': '2.216', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.100'} +[2023-09-14 12:47:52,282][102005] DAMAGECOUNT value on done: 702.0 +[2023-09-14 12:47:52,283][102005] DAMAGECOUNT value on done: 602.0 +[2023-09-14 12:47:52,643][102004] DAMAGECOUNT value on done: 1014.0 +[2023-09-14 12:47:52,643][102004] DAMAGECOUNT value on done: 1000.0 +[2023-09-14 12:47:52,644][102004] Sum rewards: 6.334, reward structure: {'HEALTH': '-1.500', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.032', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.159', 'WEAPON3': '0.200', 'weapon2': '0.278', 'weapon3': '0.640', 'weapon4': '0.714', 'FRAGCOUNT': '2.000', 'weapon5': '2.236', 'DAMAGECOUNT': '2.350'} +[2023-09-14 12:47:52,645][102004] Sum rewards: 3.037, reward structure: {'HEALTH': '-2.350', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO4': '0.001', 'AMMO5': '0.015', 'AMMO3': '0.040', 'weapon4': '0.060', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'WEAPON3': '0.400', 'weapon2': '0.568', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.550', 'weapon3': '1.614', 'weapon5': '1.738'} +[2023-09-14 12:47:52,783][102005] DAMAGECOUNT value on done: 1570.0 +[2023-09-14 12:47:52,783][102005] DAMAGECOUNT value on done: 1595.0 +[2023-09-14 12:47:52,784][102005] Sum rewards: 6.977, reward structure: {'HEALTH': '-2.900', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.015', 'AMMO4': '0.019', 'AMMO3': '0.071', 'WEAPON4': '0.200', 'weapon4': '0.250', 'WEAPON5': '0.300', 'weapon2': '0.346', 'WEAPON3': '0.600', 'weapon5': '1.524', 'weapon3': '1.848', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.700'} +[2023-09-14 12:47:52,784][102005] Sum rewards: 2.610, reward structure: {'DEATHCOUNT': '-4.000', 'HEALTH': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO2': '0.032', 'AMMO3': '0.119', 'AMMO4': '0.158', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon4': '0.304', 'weapon2': '0.412', 'weapon5': '0.532', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.999', 'weapon3': '2.540', 'DAMAGECOUNT': '3.000'} +[2023-09-14 12:47:53,767][102040] DAMAGECOUNT value on done: 1040.0 +[2023-09-14 12:47:53,767][102040] DAMAGECOUNT value on done: 710.0 +[2023-09-14 12:47:53,767][102040] Sum rewards: 5.903, reward structure: {'HEALTH': '-0.650', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.025', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.125', 'WEAPON3': '0.200', 'weapon4': '0.326', 'weapon2': '0.610', 'weapon3': '0.698', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon5': '2.344'} +[2023-09-14 12:47:54,393][102040] DAMAGECOUNT value on done: 1330.0 +[2023-09-14 12:47:54,393][102040] DAMAGECOUNT value on done: 1455.0 +[2023-09-14 12:47:54,394][102040] Sum rewards: 4.287, reward structure: {'DEATHCOUNT': '-5.000', 'HEALTH': '-5.000', 'HITCOUNT': '0.000', 'AMMO2': '0.009', 'AMMO5': '0.025', 'AMMO4': '0.045', 'AMMO3': '0.166', 'WEAPON4': '0.400', 'weapon2': '0.480', 'WEAPON5': '0.500', 'weapon4': '0.560', 'weapon5': '0.596', 'WEAPON3': '1.100', 'weapon3': '2.156', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.250'} +[2023-09-14 12:47:54,394][102040] Sum rewards: 8.088, reward structure: {'DEATHCOUNT': '-4.000', 'HEALTH': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.027', 'AMMO4': '0.134', 'AMMO3': '0.135', 'weapon5': '0.152', 'weapon4': '0.356', 'WEAPON5': '0.400', 'WEAPON4': '0.400', 'weapon2': '0.602', 'WEAPON3': '1.000', 'weapon3': '2.762', 'FRAGCOUNT': '5.000', 'DAMAGECOUNT': '5.100'} +[2023-09-14 12:47:54,577][109198] Fps is (10 sec: 14336.1, 60 sec: 14336.0, 300 sec: 13630.1). Total num frames: 13287424. Throughput: 0: 1854.4, 1: 1700.7. Samples: 793900. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:47:54,579][109198] Avg episode reward: [(0, '4.863'), (1, '3.462')] +[2023-09-14 12:47:54,580][101718] Saving new best policy, reward=4.863! +[2023-09-14 12:47:56,219][101965] Updated weights for policy 0, policy_version 2035 (0.0012) +[2023-09-14 12:47:57,217][101964] Updated weights for policy 1, policy_version 1217 (0.0014) +[2023-09-14 12:47:59,577][109198] Fps is (10 sec: 14745.5, 60 sec: 14336.0, 300 sec: 13653.3). Total num frames: 13361152. Throughput: 0: 1849.2, 1: 1696.0. Samples: 815342. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:47:59,579][109198] Avg episode reward: [(0, '4.863'), (1, '3.462')] +[2023-09-14 12:48:00,093][102039] DAMAGECOUNT value on done: 770.0 +[2023-09-14 12:48:00,093][102039] DAMAGECOUNT value on done: 530.0 +[2023-09-14 12:48:00,094][102039] Sum rewards: 6.245, reward structure: {'HEALTH': '-0.200', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.694', 'weapon3': '0.762', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon5': '2.664'} +[2023-09-14 12:48:00,216][102046] DAMAGECOUNT value on done: 815.0 +[2023-09-14 12:48:00,216][102046] DAMAGECOUNT value on done: 935.0 +[2023-09-14 12:48:00,216][102046] Sum rewards: 4.125, reward structure: {'HEALTH': '-1.500', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.038', 'AMMO3': '0.040', 'AMMO4': '0.187', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.370', 'WEAPON3': '0.400', 'weapon4': '0.786', 'FRAGCOUNT': '1.000', 'weapon5': '1.000', 'weapon3': '1.194', 'DAMAGECOUNT': '1.200'} +[2023-09-14 12:48:00,217][102046] Sum rewards: 3.447, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.061', 'AMMO2': '-0.012', 'HITCOUNT': '0.000', 'AMMO5': '0.013', 'AMMO3': '0.060', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon2': '0.906', 'weapon5': '0.980', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.600', 'weapon3': '2.062'} +[2023-09-14 12:48:00,642][102039] DAMAGECOUNT value on done: 1009.0 +[2023-09-14 12:48:00,642][102039] DAMAGECOUNT value on done: 1706.0 +[2023-09-14 12:48:00,643][102039] Sum rewards: 3.694, reward structure: {'HEALTH': '-2.100', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.024', 'weapon2': '0.032', 'AMMO3': '0.060', 'AMMO4': '0.120', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'WEAPON3': '0.600', 'weapon5': '0.908', 'weapon4': '0.968', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.750', 'weapon3': '1.822'} +[2023-09-14 12:48:00,643][102039] Sum rewards: 5.912, reward structure: {'HEALTH': '-1.750', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.020', 'AMMO3': '0.040', 'weapon2': '0.042', 'AMMO4': '0.099', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.796', 'weapon5': '1.236', 'weapon3': '1.384', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.340'} +[2023-09-14 12:48:00,773][102046] DAMAGECOUNT value on done: 898.0 +[2023-09-14 12:48:00,773][102046] DAMAGECOUNT value on done: 1355.0 +[2023-09-14 12:48:00,773][102046] Sum rewards: 3.589, reward structure: {'HEALTH': '-1.600', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.020', 'weapon2': '0.024', 'AMMO3': '0.030', 'AMMO4': '0.099', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon4': '0.790', 'weapon3': '0.916', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.250', 'weapon5': '1.350'} +[2023-09-14 12:48:00,774][102046] Sum rewards: 5.202, reward structure: {'HEALTH': '-1.250', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.050', 'weapon2': '0.150', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.576', 'FRAGCOUNT': '1.000', 'weapon3': '1.270', 'DAMAGECOUNT': '1.600', 'weapon5': '1.946'} +[2023-09-14 12:48:01,671][101965] Updated weights for policy 0, policy_version 2045 (0.0013) +[2023-09-14 12:48:02,026][102039] DAMAGECOUNT value on done: 1055.0 +[2023-09-14 12:48:02,027][102039] DAMAGECOUNT value on done: 679.0 +[2023-09-14 12:48:02,027][102039] Sum rewards: 3.794, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO3': '0.060', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.302', 'weapon2': '0.540', 'WEAPON3': '0.600', 'weapon5': '0.900', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.700', 'weapon3': '2.190'} +[2023-09-14 12:48:02,028][102039] Sum rewards: 6.120, reward structure: {'HEALTH': '-1.600', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.020', 'AMMO3': '0.040', 'AMMO4': '0.100', 'weapon2': '0.126', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.792', 'weapon3': '1.226', 'weapon5': '1.406', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.200'} +[2023-09-14 12:48:02,038][102046] DAMAGECOUNT value on done: 525.0 +[2023-09-14 12:48:02,038][102046] DAMAGECOUNT value on done: 539.0 +[2023-09-14 12:48:02,038][102046] Sum rewards: 4.861, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.029', 'AMMO3': '0.055', 'WEAPON5': '0.100', 'AMMO4': '0.145', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.456', 'weapon4': '0.492', 'weapon3': '0.786', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon5': '2.196'} +[2023-09-14 12:48:02,072][102003] DAMAGECOUNT value on done: 1410.0 +[2023-09-14 12:48:02,072][102003] DAMAGECOUNT value on done: 1115.0 +[2023-09-14 12:48:02,073][102003] Sum rewards: 5.786, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.006', 'AMMO5': '0.020', 'AMMO4': '0.030', 'AMMO3': '0.089', 'WEAPON4': '0.200', 'weapon5': '0.264', 'WEAPON5': '0.400', 'weapon2': '0.422', 'weapon4': '0.426', 'WEAPON3': '0.800', 'weapon3': '2.728', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.400'} +[2023-09-14 12:48:02,073][102003] Sum rewards: 5.061, reward structure: {'HEALTH': '-3.350', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.014', 'AMMO5': '0.015', 'weapon2': '0.044', 'AMMO4': '0.069', 'AMMO3': '0.087', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'WEAPON3': '0.700', 'weapon4': '0.750', 'weapon5': '1.158', 'weapon3': '1.924', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.050'} +[2023-09-14 12:48:02,120][102001] DAMAGECOUNT value on done: 745.0 +[2023-09-14 12:48:02,121][102001] Sum rewards: 7.254, reward structure: {'HEALTH': '-2.150', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'weapon2': '0.006', 'AMMO2': '0.014', 'AMMO5': '0.015', 'AMMO3': '0.066', 'AMMO4': '0.068', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon4': '0.544', 'WEAPON3': '0.600', 'weapon5': '1.636', 'weapon3': '1.754', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.100'} +[2023-09-14 12:48:02,120][102001] DAMAGECOUNT value on done: 755.0 +[2023-09-14 12:48:02,122][102001] Sum rewards: 3.417, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.024', 'AMMO3': '0.090', 'AMMO4': '0.119', 'weapon2': '0.228', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon5': '0.620', 'WEAPON3': '0.700', 'weapon4': '1.096', 'weapon3': '1.724', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.200'} +[2023-09-14 12:48:02,609][102039] DAMAGECOUNT value on done: 878.0 +[2023-09-14 12:48:02,609][102039] DAMAGECOUNT value on done: 1047.0 +[2023-09-14 12:48:02,610][102039] Sum rewards: 4.880, reward structure: {'HEALTH': '-1.450', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'weapon2': '0.028', 'AMMO2': '0.040', 'AMMO3': '0.043', 'AMMO4': '0.199', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.804', 'FRAGCOUNT': '1.000', 'weapon3': '1.192', 'DAMAGECOUNT': '1.250', 'weapon5': '1.964'} +[2023-09-14 12:48:02,610][102039] Sum rewards: 5.198, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.412', 'FRAGCOUNT': '1.000', 'weapon3': '1.124', 'DAMAGECOUNT': '1.550', 'weapon5': '2.462'} +[2023-09-14 12:48:02,624][102046] DAMAGECOUNT value on done: 1251.0 +[2023-09-14 12:48:02,625][102046] DAMAGECOUNT value on done: 850.0 +[2023-09-14 12:48:02,625][102046] Sum rewards: 6.401, reward structure: {'HEALTH': '-2.200', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.025', 'AMMO3': '0.055', 'WEAPON5': '0.100', 'AMMO4': '0.125', 'weapon5': '0.264', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'weapon2': '0.518', 'weapon4': '0.974', 'weapon3': '1.484', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.250'} +[2023-09-14 12:48:02,626][102046] Sum rewards: 3.578, reward structure: {'HEALTH': '-3.250', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.016', 'AMMO5': '0.020', 'AMMO4': '0.080', 'AMMO3': '0.081', 'WEAPON4': '0.200', 'weapon4': '0.240', 'weapon2': '0.244', 'WEAPON5': '0.400', 'WEAPON3': '0.700', 'weapon5': '1.226', 'FRAGCOUNT': '2.000', 'weapon3': '2.270', 'DAMAGECOUNT': '2.350'} +[2023-09-14 12:48:02,673][102003] DAMAGECOUNT value on done: 465.0 +[2023-09-14 12:48:02,673][102003] DAMAGECOUNT value on done: 612.0 +[2023-09-14 12:48:02,674][102003] Sum rewards: 4.423, reward structure: {'HEALTH': '-1.220', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.039', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.046', 'weapon3': '1.300', 'weapon5': '1.678'} +[2023-09-14 12:48:02,674][102003] Sum rewards: 4.664, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.030', 'AMMO2': '0.034', 'WEAPON5': '0.100', 'AMMO4': '0.169', 'WEAPON4': '0.200', 'weapon2': '0.282', 'WEAPON3': '0.300', 'weapon4': '0.850', 'weapon3': '0.978', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.220', 'weapon5': '1.496'} +[2023-09-14 12:48:02,697][102001] DAMAGECOUNT value on done: 998.0 +[2023-09-14 12:48:02,697][102001] DAMAGECOUNT value on done: 640.0 +[2023-09-14 12:48:02,698][102001] Sum rewards: 5.649, reward structure: {'HEALTH': '-2.950', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.022', 'AMMO3': '0.053', 'AMMO4': '0.107', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon2': '0.316', 'WEAPON3': '0.500', 'weapon4': '0.892', 'weapon5': '0.944', 'weapon3': '1.480', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '3.670'} +[2023-09-14 12:48:02,698][102001] Sum rewards: 2.713, reward structure: {'HEALTH': '-3.150', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.016', 'AMMO5': '0.020', 'AMMO4': '0.081', 'AMMO3': '0.097', 'weapon4': '0.100', 'WEAPON4': '0.200', 'WEAPON5': '0.400', 'weapon5': '0.608', 'weapon2': '0.794', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '2.346', 'DAMAGECOUNT': '2.400'} +[2023-09-14 12:48:03,087][101964] Updated weights for policy 1, policy_version 1227 (0.0013) +[2023-09-14 12:48:03,146][102003] DAMAGECOUNT value on done: 963.0 +[2023-09-14 12:48:03,146][102003] DAMAGECOUNT value on done: 790.0 +[2023-09-14 12:48:03,721][102003] DAMAGECOUNT value on done: 1015.0 +[2023-09-14 12:48:03,722][102003] DAMAGECOUNT value on done: 735.0 +[2023-09-14 12:48:03,722][102003] Sum rewards: 4.562, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.003', 'AMMO5': '0.010', 'AMMO4': '0.017', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.236', 'weapon2': '0.348', 'WEAPON3': '0.400', 'weapon3': '1.364', 'weapon5': '1.744', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.000'} +[2023-09-14 12:48:03,722][102003] Sum rewards: 4.711, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.024', 'AMMO3': '0.059', 'AMMO4': '0.120', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon2': '0.310', 'WEAPON3': '0.500', 'weapon4': '0.828', 'weapon5': '0.950', 'weapon3': '1.354', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050'} +[2023-09-14 12:48:04,037][102001] DAMAGECOUNT value on done: 1733.0 +[2023-09-14 12:48:04,037][102001] DAMAGECOUNT value on done: 1655.0 +[2023-09-14 12:48:04,038][102001] Sum rewards: 5.524, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO4': '0.007', 'AMMO5': '0.020', 'AMMO3': '0.093', 'WEAPON4': '0.200', 'WEAPON5': '0.400', 'weapon2': '0.422', 'weapon4': '0.482', 'weapon5': '0.586', 'WEAPON3': '0.800', 'weapon3': '2.362', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.150'} +[2023-09-14 12:48:04,038][102001] Sum rewards: 5.534, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.020', 'WEAPON4': '0.100', 'AMMO3': '0.108', 'weapon4': '0.322', 'weapon2': '0.324', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'weapon5': '1.436', 'weapon3': '1.870', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.150'} +[2023-09-14 12:48:04,577][109198] Fps is (10 sec: 14335.9, 60 sec: 14267.7, 300 sec: 13658.9). Total num frames: 13430784. Throughput: 0: 1853.0, 1: 1698.0. Samples: 826123. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:48:04,579][109198] Avg episode reward: [(0, '4.900'), (1, '3.748')] +[2023-09-14 12:48:04,580][101718] Saving new best policy, reward=4.900! +[2023-09-14 12:48:04,580][101802] Saving new best policy, reward=3.748! +[2023-09-14 12:48:04,747][102001] DAMAGECOUNT value on done: 780.0 +[2023-09-14 12:48:04,748][102001] Sum rewards: 3.346, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.015', 'AMMO3': '0.062', 'AMMO4': '0.077', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon2': '0.402', 'WEAPON3': '0.500', 'weapon4': '0.584', 'FRAGCOUNT': '1.000', 'weapon3': '1.314', 'weapon5': '1.432', 'DAMAGECOUNT': '1.450'} +[2023-09-14 12:48:04,748][102001] DAMAGECOUNT value on done: 746.0 +[2023-09-14 12:48:04,749][102001] Sum rewards: 6.085, reward structure: {'HEALTH': '-1.500', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.020', 'AMMO3': '0.044', 'AMMO4': '0.099', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.404', 'weapon4': '0.694', 'weapon5': '1.014', 'weapon3': '1.202', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.300'} +[2023-09-14 12:48:07,159][101965] Updated weights for policy 0, policy_version 2055 (0.0014) +[2023-09-14 12:48:09,165][101964] Updated weights for policy 1, policy_version 1237 (0.0012) +[2023-09-14 12:48:09,577][109198] Fps is (10 sec: 13926.4, 60 sec: 14199.5, 300 sec: 13664.3). Total num frames: 13500416. Throughput: 0: 1853.2, 1: 1697.7. Samples: 847543. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:48:09,579][109198] Avg episode reward: [(0, '4.900'), (1, '3.739')] +[2023-09-14 12:48:12,757][101965] Updated weights for policy 0, policy_version 2065 (0.0013) +[2023-09-14 12:48:12,869][102004] DAMAGECOUNT value on done: 1399.0 +[2023-09-14 12:48:12,869][102004] Sum rewards: 0.164, reward structure: {'HEALTH': '-6.150', 'DEATHCOUNT': '-6.000', 'HITCOUNT': '0.000', 'AMMO5': '0.025', 'AMMO2': '0.036', 'AMMO3': '0.161', 'AMMO4': '0.179', 'weapon4': '0.280', 'weapon5': '0.286', 'WEAPON4': '0.400', 'WEAPON5': '0.500', 'weapon2': '0.994', 'WEAPON3': '1.100', 'weapon3': '2.302', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.050'} +[2023-09-14 12:48:12,870][102004] DAMAGECOUNT value on done: 2261.0 +[2023-09-14 12:48:12,870][102004] Sum rewards: 11.684, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'AMMO4': '-0.006', 'AMMO2': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO3': '0.066', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.338', 'weapon2': '0.346', 'WEAPON3': '0.600', 'weapon5': '1.260', 'weapon3': '2.016', 'FRAGCOUNT': '6.000', 'DAMAGECOUNT': '6.550'} +[2023-09-14 12:48:13,364][102004] DAMAGECOUNT value on done: 1240.0 +[2023-09-14 12:48:13,365][102004] DAMAGECOUNT value on done: 1210.0 +[2023-09-14 12:48:13,365][102004] Sum rewards: 6.235, reward structure: {'HEALTH': '-1.650', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.010', 'weapon2': '0.030', 'AMMO3': '0.041', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.204', 'WEAPON3': '0.400', 'weapon3': '1.350', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.100', 'weapon5': '2.450'} +[2023-09-14 12:48:13,366][102004] Sum rewards: 3.837, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.010', 'AMMO5': '0.015', 'AMMO4': '0.050', 'AMMO3': '0.073', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'weapon4': '0.302', 'weapon2': '0.346', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon5': '1.536', 'DAMAGECOUNT': '1.700', 'weapon3': '1.804'} +[2023-09-14 12:48:14,577][109198] Fps is (10 sec: 14336.0, 60 sec: 14267.7, 300 sec: 13685.5). Total num frames: 13574144. Throughput: 0: 1861.0, 1: 1706.9. Samples: 869401. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:48:14,579][109198] Avg episode reward: [(0, '4.939'), (1, '3.739')] +[2023-09-14 12:48:14,580][101718] Saving new best policy, reward=4.939! +[2023-09-14 12:48:14,966][101964] Updated weights for policy 1, policy_version 1247 (0.0011) +[2023-09-14 12:48:15,671][102040] Large shaping reward 2.942 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 2.0), ('DAMAGECOUNT', 1.94, 194.0), ('weapon5', 0.002)] +[2023-09-14 12:48:18,107][101965] Updated weights for policy 0, policy_version 2075 (0.0012) +[2023-09-14 12:48:19,577][109198] Fps is (10 sec: 14335.9, 60 sec: 14267.7, 300 sec: 13690.1). Total num frames: 13643776. Throughput: 0: 1865.3, 1: 1713.7. Samples: 880128. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:48:19,579][109198] Avg episode reward: [(0, '4.939'), (1, '3.739')] +[2023-09-14 12:48:20,830][101964] Updated weights for policy 1, policy_version 1257 (0.0013) +[2023-09-14 12:48:22,774][102037] DAMAGECOUNT value on done: 1701.0 +[2023-09-14 12:48:22,775][102037] Sum rewards: 7.261, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.006', 'AMMO5': '0.010', 'weapon2': '0.028', 'AMMO4': '0.028', 'AMMO3': '0.040', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.502', 'weapon3': '1.398', 'FRAGCOUNT': '1.999', 'weapon5': '2.050', 'DAMAGECOUNT': '2.400'} +[2023-09-14 12:48:22,775][102037] DAMAGECOUNT value on done: 1300.0 +[2023-09-14 12:48:23,321][102037] DAMAGECOUNT value on done: 910.0 +[2023-09-14 12:48:23,321][102037] DAMAGECOUNT value on done: 942.0 +[2023-09-14 12:48:23,322][102037] Sum rewards: 2.372, reward structure: {'HEALTH': '-1.960', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.006', 'AMMO5': '0.010', 'AMMO4': '0.031', 'AMMO3': '0.048', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.204', 'weapon2': '0.316', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.450', 'weapon3': '1.306', 'weapon5': '2.162'} +[2023-09-14 12:48:23,507][101965] Updated weights for policy 0, policy_version 2085 (0.0013) +[2023-09-14 12:48:23,628][102037] DAMAGECOUNT value on done: 1860.0 +[2023-09-14 12:48:23,628][102037] DAMAGECOUNT value on done: 1750.0 +[2023-09-14 12:48:23,629][102037] Sum rewards: 4.487, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.018', 'AMMO3': '0.077', 'AMMO4': '0.090', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.350', 'weapon2': '0.374', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon5': '1.572', 'weapon3': '1.640', 'DAMAGECOUNT': '2.250'} +[2023-09-14 12:48:23,629][102037] Sum rewards: 4.171, reward structure: {'HEALTH': '-2.950', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.010', 'AMMO2': '-0.002', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'weapon4': '0.044', 'AMMO3': '0.067', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon2': '0.722', 'weapon5': '1.296', 'weapon3': '1.890', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.100'} +[2023-09-14 12:48:24,231][102037] DAMAGECOUNT value on done: 930.0 +[2023-09-14 12:48:24,231][102037] DAMAGECOUNT value on done: 899.0 +[2023-09-14 12:48:24,232][102037] Sum rewards: 3.431, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.030', 'AMMO3': '0.049', 'WEAPON4': '0.100', 'AMMO4': '0.150', 'WEAPON5': '0.200', 'weapon2': '0.210', 'WEAPON3': '0.400', 'weapon4': '0.566', 'DAMAGECOUNT': '0.950', 'weapon3': '1.164', 'weapon5': '1.604'} +[2023-09-14 12:48:24,577][109198] Fps is (10 sec: 14336.1, 60 sec: 14267.7, 300 sec: 13710.0). Total num frames: 13717504. Throughput: 0: 1865.4, 1: 1711.9. Samples: 901608. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:48:24,579][109198] Avg episode reward: [(0, '4.883'), (1, '3.713')] +[2023-09-14 12:48:24,798][102005] DAMAGECOUNT value on done: 678.0 +[2023-09-14 12:48:24,798][102005] DAMAGECOUNT value on done: 580.0 +[2023-09-14 12:48:24,798][102005] Sum rewards: 6.564, reward structure: {'HEALTH': '-0.650', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'AMMO2': '0.020', 'weapon2': '0.076', 'AMMO4': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.610', 'weapon3': '0.674', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '2.020', 'weapon5': '2.292'} +[2023-09-14 12:48:25,300][102005] DAMAGECOUNT value on done: 1139.0 +[2023-09-14 12:48:25,301][102005] DAMAGECOUNT value on done: 1458.0 +[2023-09-14 12:48:25,301][102005] Sum rewards: 5.803, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.030', 'weapon2': '0.044', 'AMMO3': '0.057', 'AMMO4': '0.149', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.500', 'weapon4': '1.020', 'weapon5': '1.360', 'weapon3': '1.382', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.850'} +[2023-09-14 12:48:25,302][102005] Sum rewards: 2.478, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.008', 'AMMO5': '0.009', 'AMMO4': '0.041', 'weapon2': '0.066', 'AMMO3': '0.077', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon4': '0.654', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon5': '1.092', 'weapon3': '1.830', 'DAMAGECOUNT': '2.500'} +[2023-09-14 12:48:26,793][101964] Updated weights for policy 1, policy_version 1267 (0.0012) +[2023-09-14 12:48:26,998][102039] Large shaping reward 2.602 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 1.0), ('DAMAGECOUNT', 1.6, 160.0), ('weapon5', 0.002)] +[2023-09-14 12:48:27,196][102040] DAMAGECOUNT value on done: 955.0 +[2023-09-14 12:48:27,197][102040] DAMAGECOUNT value on done: 1175.0 +[2023-09-14 12:48:27,197][102040] Sum rewards: 4.996, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.050', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.610', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon3': '1.368', 'weapon5': '2.008'} +[2023-09-14 12:48:27,198][102040] Sum rewards: 4.017, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.007', 'AMMO4': '0.035', 'AMMO3': '0.040', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.304', 'WEAPON3': '0.400', 'weapon2': '0.590', 'FRAGCOUNT': '1.000', 'weapon5': '1.000', 'DAMAGECOUNT': '1.150', 'weapon3': '1.288'} +[2023-09-14 12:48:27,748][102040] DAMAGECOUNT value on done: 557.0 +[2023-09-14 12:48:27,748][102040] DAMAGECOUNT value on done: 870.0 +[2023-09-14 12:48:27,749][102040] Sum rewards: 3.800, reward structure: {'HEALTH': '-2.500', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.011', 'AMMO5': '0.015', 'AMMO4': '0.053', 'AMMO3': '0.059', 'WEAPON4': '0.200', 'weapon4': '0.206', 'WEAPON5': '0.300', 'weapon5': '0.426', 'WEAPON3': '0.600', 'weapon2': '0.698', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '2.150', 'weapon3': '2.582'} +[2023-09-14 12:48:27,749][102040] Sum rewards: 4.529, reward structure: {'HEALTH': '-2.200', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.025', 'AMMO3': '0.090', 'AMMO4': '0.126', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon2': '0.554', 'WEAPON3': '0.600', 'weapon3': '0.914', 'weapon4': '0.990', 'FRAGCOUNT': '1.000', 'weapon5': '1.392', 'DAMAGECOUNT': '2.530'} +[2023-09-14 12:48:28,699][102004] DAMAGECOUNT value on done: 1766.0 +[2023-09-14 12:48:28,699][102004] DAMAGECOUNT value on done: 1431.0 +[2023-09-14 12:48:28,699][102004] Sum rewards: 6.518, reward structure: {'HEALTH': '-1.350', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'weapon2': '0.166', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.392', 'WEAPON3': '0.400', 'weapon3': '1.300', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050', 'weapon5': '2.110'} +[2023-09-14 12:48:28,700][102004] Sum rewards: 3.512, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.009', 'AMMO5': '0.015', 'AMMO4': '0.047', 'AMMO3': '0.062', 'weapon2': '0.084', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'weapon4': '0.404', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.350', 'weapon5': '1.400', 'weapon3': '2.140'} +[2023-09-14 12:48:28,835][102005] DAMAGECOUNT value on done: 903.0 +[2023-09-14 12:48:28,835][102005] DAMAGECOUNT value on done: 852.0 +[2023-09-14 12:48:28,836][102005] Sum rewards: 3.812, reward structure: {'HEALTH': '-2.500', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.013', 'AMMO3': '0.051', 'AMMO4': '0.063', 'weapon2': '0.068', 'WEAPON5': '0.100', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'weapon4': '0.566', 'weapon5': '0.922', 'weapon3': '1.716', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.010'} +[2023-09-14 12:48:28,836][102005] Sum rewards: 3.632, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.029', 'AMMO3': '0.078', 'AMMO4': '0.146', 'WEAPON5': '0.200', 'weapon2': '0.200', 'WEAPON4': '0.300', 'weapon5': '0.554', 'WEAPON3': '0.700', 'weapon4': '0.950', 'weapon3': '1.968', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.500'} +[2023-09-14 12:48:28,931][101965] Updated weights for policy 0, policy_version 2095 (0.0012) +[2023-09-14 12:48:29,328][102004] DAMAGECOUNT value on done: 1079.0 +[2023-09-14 12:48:29,329][102004] DAMAGECOUNT value on done: 1075.0 +[2023-09-14 12:48:29,409][102005] DAMAGECOUNT value on done: 2115.0 +[2023-09-14 12:48:29,409][102005] DAMAGECOUNT value on done: 2110.0 +[2023-09-14 12:48:29,410][102005] Sum rewards: 4.078, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-6.000', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO4': '0.011', 'AMMO5': '0.025', 'WEAPON4': '0.100', 'AMMO3': '0.159', 'weapon4': '0.160', 'WEAPON5': '0.500', 'weapon5': '0.550', 'weapon2': '0.784', 'WEAPON3': '1.100', 'weapon3': '2.238', 'FRAGCOUNT': '4.999', 'DAMAGECOUNT': '5.450'} +[2023-09-14 12:48:29,410][102005] Sum rewards: 6.239, reward structure: {'HEALTH': '-5.200', 'DEATHCOUNT': '-5.000', 'HITCOUNT': '0.000', 'AMMO5': '0.025', 'AMMO2': '0.041', 'weapon5': '0.100', 'weapon4': '0.132', 'AMMO3': '0.160', 'AMMO4': '0.203', 'WEAPON4': '0.300', 'weapon2': '0.406', 'WEAPON5': '0.500', 'WEAPON3': '1.200', 'weapon3': '3.222', 'FRAGCOUNT': '5.000', 'DAMAGECOUNT': '5.150'} +[2023-09-14 12:48:29,577][109198] Fps is (10 sec: 14745.7, 60 sec: 14336.0, 300 sec: 13729.2). Total num frames: 13791232. Throughput: 0: 1869.6, 1: 1718.6. Samples: 923503. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:48:29,579][109198] Avg episode reward: [(0, '4.924'), (1, '3.835')] +[2023-09-14 12:48:29,586][101802] Saving new best policy, reward=3.835! +[2023-09-14 12:48:31,396][102040] DAMAGECOUNT value on done: 954.0 +[2023-09-14 12:48:31,397][102040] DAMAGECOUNT value on done: 1176.0 +[2023-09-14 12:48:31,397][102040] Sum rewards: 5.706, reward structure: {'HEALTH': '-1.360', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.022', 'AMMO3': '0.050', 'WEAPON5': '0.100', 'AMMO4': '0.109', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.440', 'weapon4': '0.612', 'weapon2': '0.726', 'weapon3': '0.964', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.440'} +[2023-09-14 12:48:31,397][102040] Sum rewards: 2.066, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.025', 'AMMO3': '0.040', 'AMMO4': '0.124', 'weapon2': '0.136', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.606', 'weapon4': '0.676', 'FRAGCOUNT': '1.000', 'weapon3': '1.292', 'DAMAGECOUNT': '1.360'} +[2023-09-14 12:48:31,949][102040] DAMAGECOUNT value on done: 1620.0 +[2023-09-14 12:48:31,949][102040] DAMAGECOUNT value on done: 1680.0 +[2023-09-14 12:48:31,950][102040] Sum rewards: 0.509, reward structure: {'DEATHCOUNT': '-4.000', 'HEALTH': '-4.000', 'HITCOUNT': '0.000', 'AMMO2': '0.023', 'AMMO5': '0.024', 'AMMO4': '0.114', 'AMMO3': '0.124', 'WEAPON4': '0.300', 'WEAPON5': '0.500', 'weapon5': '0.518', 'weapon4': '0.576', 'FRAGCOUNT': '0.999', 'WEAPON3': '1.000', 'DAMAGECOUNT': '1.650', 'weapon3': '2.680'} +[2023-09-14 12:48:31,950][102040] Sum rewards: 7.629, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.022', 'AMMO3': '0.060', 'weapon2': '0.062', 'AMMO4': '0.108', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'weapon4': '0.784', 'weapon5': '1.398', 'weapon3': '1.686', 'FRAGCOUNT': '2.999', 'DAMAGECOUNT': '3.500'} +[2023-09-14 12:48:32,800][101964] Updated weights for policy 1, policy_version 1277 (0.0012) +[2023-09-14 12:48:34,501][101965] Updated weights for policy 0, policy_version 2105 (0.0012) +[2023-09-14 12:48:34,577][109198] Fps is (10 sec: 14745.5, 60 sec: 14404.3, 300 sec: 13747.7). Total num frames: 13864960. Throughput: 0: 1869.6, 1: 1720.2. Samples: 934250. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:48:34,579][109198] Avg episode reward: [(0, '4.874'), (1, '3.842')] +[2023-09-14 12:48:34,581][101802] Saving new best policy, reward=3.842! +[2023-09-14 12:48:38,667][102046] DAMAGECOUNT value on done: 900.0 +[2023-09-14 12:48:38,668][102046] DAMAGECOUNT value on done: 1010.0 +[2023-09-14 12:48:38,668][102046] Sum rewards: 1.355, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.002', 'HITCOUNT': '0.000', 'AMMO5': '0.006', 'AMMO2': '0.026', 'AMMO3': '0.059', 'AMMO4': '0.128', 'WEAPON5': '0.200', 'weapon2': '0.256', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'weapon5': '0.758', 'DAMAGECOUNT': '0.850', 'weapon4': '0.852', 'weapon3': '1.422'} +[2023-09-14 12:48:39,005][101964] Updated weights for policy 1, policy_version 1287 (0.0012) +[2023-09-14 12:48:39,283][102039] DAMAGECOUNT value on done: 920.0 +[2023-09-14 12:48:39,284][102039] DAMAGECOUNT value on done: 770.0 +[2023-09-14 12:48:39,284][102039] Sum rewards: 4.814, reward structure: {'HEALTH': '-1.300', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.698', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.500', 'weapon3': '1.520', 'weapon5': '1.806'} +[2023-09-14 12:48:39,285][102039] Sum rewards: 4.487, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.025', 'AMMO3': '0.077', 'AMMO4': '0.127', 'weapon2': '0.142', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'WEAPON3': '0.600', 'weapon4': '0.888', 'FRAGCOUNT': '0.999', 'weapon5': '1.322', 'weapon3': '1.398', 'DAMAGECOUNT': '2.400'} +[2023-09-14 12:48:39,315][102046] DAMAGECOUNT value on done: 1009.0 +[2023-09-14 12:48:39,315][102046] DAMAGECOUNT value on done: 1470.0 +[2023-09-14 12:48:39,317][102046] Sum rewards: 3.431, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.006', 'AMMO4': '0.032', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.228', 'weapon5': '0.310', 'WEAPON3': '0.400', 'weapon2': '0.876', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150', 'weapon3': '1.186'} +[2023-09-14 12:48:39,316][102046] Sum rewards: 3.496, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.020', 'AMMO3': '0.030', 'AMMO4': '0.100', 'AMMO6': '0.100', 'AMMO7': '0.100', 'weapon6': '0.148', 'WEAPON4': '0.200', 'WEAPON6': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.464', 'weapon4': '0.676', 'FRAGCOUNT': '1.000', 'weapon3': '1.048', 'DAMAGECOUNT': '1.110'} +[2023-09-14 12:48:39,577][109198] Fps is (10 sec: 13516.8, 60 sec: 14267.7, 300 sec: 13721.6). Total num frames: 13926400. Throughput: 0: 1867.9, 1: 1716.6. Samples: 955203. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:48:39,579][109198] Avg episode reward: [(0, '4.894'), (1, '3.839')] +[2023-09-14 12:48:39,854][102039] DAMAGECOUNT value on done: 1756.0 +[2023-09-14 12:48:39,854][102039] DAMAGECOUNT value on done: 1176.0 +[2023-09-14 12:48:39,855][102039] Sum rewards: 4.794, reward structure: {'HEALTH': '-0.500', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.015', 'weapon2': '0.016', 'AMMO3': '0.020', 'AMMO4': '0.074', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.504', 'weapon3': '0.638', 'weapon5': '0.954', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.670'} +[2023-09-14 12:48:40,196][101965] Updated weights for policy 0, policy_version 2115 (0.0012) +[2023-09-14 12:48:40,575][102046] DAMAGECOUNT value on done: 762.0 +[2023-09-14 12:48:40,575][102046] Sum rewards: 4.829, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.020', 'weapon2': '0.034', 'AMMO3': '0.068', 'AMMO4': '0.099', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.500', 'weapon4': '0.800', 'weapon3': '1.052', 'weapon5': '1.478', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.370'} +[2023-09-14 12:48:40,576][102046] DAMAGECOUNT value on done: 644.0 +[2023-09-14 12:48:40,576][102046] Sum rewards: 1.415, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.012', 'AMMO2': '0.021', 'AMMO3': '0.100', 'AMMO4': '0.106', 'weapon2': '0.254', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'WEAPON3': '0.700', 'weapon4': '0.762', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '1.386', 'weapon5': '1.424'} +[2023-09-14 12:48:40,671][102003] DAMAGECOUNT value on done: 1385.0 +[2023-09-14 12:48:40,672][102003] DAMAGECOUNT value on done: 1535.0 +[2023-09-14 12:48:40,672][102003] Sum rewards: 6.618, reward structure: {'HEALTH': '-1.750', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.040', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.292', 'weapon4': '0.344', 'WEAPON3': '0.400', 'weapon5': '1.544', 'weapon3': '1.640', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.700'} +[2023-09-14 12:48:41,058][102001] DAMAGECOUNT value on done: 760.0 +[2023-09-14 12:48:41,058][102001] DAMAGECOUNT value on done: 787.0 +[2023-09-14 12:48:41,059][102001] Sum rewards: 2.511, reward structure: {'HEALTH': '-1.320', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.058', 'DAMAGECOUNT': '0.150', 'WEAPON5': '0.200', 'weapon2': '0.366', 'WEAPON3': '0.400', 'weapon3': '0.846', 'weapon5': '2.832'} +[2023-09-14 12:48:41,136][102039] DAMAGECOUNT value on done: 718.0 +[2023-09-14 12:48:41,136][102039] DAMAGECOUNT value on done: 1165.0 +[2023-09-14 12:48:41,138][102039] Sum rewards: 5.911, reward structure: {'HEALTH': '-0.390', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.396', 'weapon3': '0.802', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon5': '2.708'} +[2023-09-14 12:48:41,261][102046] DAMAGECOUNT value on done: 1426.0 +[2023-09-14 12:48:41,261][102046] Sum rewards: 3.538, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.041', 'AMMO3': '0.070', 'WEAPON5': '0.100', 'AMMO4': '0.205', 'WEAPON4': '0.300', 'weapon2': '0.492', 'WEAPON3': '0.600', 'weapon4': '0.672', 'weapon5': '0.744', 'FRAGCOUNT': '0.999', 'weapon3': '1.560', 'DAMAGECOUNT': '1.750'} +[2023-09-14 12:48:41,262][102046] DAMAGECOUNT value on done: 1025.0 +[2023-09-14 12:48:41,262][102046] Sum rewards: 4.952, reward structure: {'HEALTH': '-1.750', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.022', 'AMMO3': '0.054', 'AMMO4': '0.110', 'weapon2': '0.186', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.332', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon3': '1.156', 'DAMAGECOUNT': '1.750', 'weapon5': '2.282'} +[2023-09-14 12:48:41,267][102003] DAMAGECOUNT value on done: 640.0 +[2023-09-14 12:48:41,268][102003] DAMAGECOUNT value on done: 841.0 +[2023-09-14 12:48:41,268][102003] Sum rewards: 3.616, reward structure: {'HEALTH': '-2.240', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.015', 'AMMO4': '0.020', 'AMMO3': '0.060', 'WEAPON4': '0.200', 'weapon2': '0.214', 'WEAPON5': '0.300', 'weapon4': '0.480', 'WEAPON3': '0.600', 'weapon5': '0.924', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.750', 'weapon3': '2.288'} +[2023-09-14 12:48:41,269][102003] Sum rewards: 5.663, reward structure: {'HEALTH': '-1.700', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.025', 'AMMO3': '0.044', 'AMMO4': '0.124', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.390', 'WEAPON3': '0.400', 'weapon4': '0.750', 'weapon2': '0.754', 'weapon3': '1.178', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.290'} +[2023-09-14 12:48:41,689][102003] DAMAGECOUNT value on done: 1210.0 +[2023-09-14 12:48:41,689][102003] DAMAGECOUNT value on done: 940.0 +[2023-09-14 12:48:41,689][102003] Sum rewards: 4.983, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO3': '0.077', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon2': '0.846', 'weapon5': '1.038', 'weapon3': '1.650', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.470'} +[2023-09-14 12:48:41,690][102003] Sum rewards: 2.862, reward structure: {'HEALTH': '-2.420', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.020', 'AMMO3': '0.061', 'AMMO4': '0.099', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon2': '0.354', 'WEAPON3': '0.500', 'weapon4': '0.922', 'FRAGCOUNT': '1.000', 'weapon5': '1.020', 'weapon3': '1.296', 'DAMAGECOUNT': '1.500'} +[2023-09-14 12:48:41,725][102039] DAMAGECOUNT value on done: 1120.0 +[2023-09-14 12:48:41,726][102039] DAMAGECOUNT value on done: 966.0 +[2023-09-14 12:48:41,781][102001] DAMAGECOUNT value on done: 1248.0 +[2023-09-14 12:48:41,782][102001] DAMAGECOUNT value on done: 835.0 +[2023-09-14 12:48:41,782][102001] Sum rewards: 3.239, reward structure: {'HEALTH': '-2.500', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.019', 'AMMO3': '0.068', 'weapon5': '0.092', 'AMMO4': '0.093', 'weapon2': '0.134', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.500', 'weapon4': '0.802', 'weapon3': '1.124', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.500'} +[2023-09-14 12:48:41,783][102001] Sum rewards: 3.719, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'weapon2': '0.018', 'AMMO5': '0.020', 'AMMO2': '0.026', 'AMMO3': '0.107', 'AMMO4': '0.129', 'WEAPON4': '0.300', 'weapon4': '0.310', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'weapon5': '1.500', 'DAMAGECOUNT': '1.950', 'FRAGCOUNT': '1.999', 'weapon3': '2.160'} +[2023-09-14 12:48:42,336][102003] DAMAGECOUNT value on done: 1055.0 +[2023-09-14 12:48:42,337][102003] Sum rewards: 4.884, reward structure: {'HEALTH': '-3.200', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.013', 'AMMO2': '0.025', 'AMMO3': '0.055', 'AMMO4': '0.126', 'WEAPON5': '0.300', 'weapon5': '0.320', 'WEAPON4': '0.400', 'weapon2': '0.424', 'WEAPON3': '0.500', 'weapon4': '1.096', 'weapon3': '1.624', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.200'} +[2023-09-14 12:48:42,337][102003] DAMAGECOUNT value on done: 1350.0 +[2023-09-14 12:48:42,337][102003] Sum rewards: 5.944, reward structure: {'HEALTH': '-3.150', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.040', 'AMMO3': '0.090', 'weapon4': '0.130', 'AMMO4': '0.198', 'WEAPON4': '0.300', 'weapon2': '0.386', 'WEAPON5': '0.400', 'weapon5': '0.498', 'WEAPON3': '0.800', 'weapon3': '2.882', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.350'} +[2023-09-14 12:48:43,172][102001] DAMAGECOUNT value on done: 2238.0 +[2023-09-14 12:48:43,172][102001] DAMAGECOUNT value on done: 2275.0 +[2023-09-14 12:48:43,172][102001] Sum rewards: 4.434, reward structure: {'HEALTH': '-6.000', 'DEATHCOUNT': '-6.000', 'HITCOUNT': '0.000', 'AMMO5': '0.025', 'AMMO2': '0.037', 'weapon2': '0.084', 'AMMO3': '0.158', 'AMMO4': '0.184', 'WEAPON4': '0.500', 'WEAPON5': '0.500', 'weapon4': '0.662', 'weapon5': '0.742', 'WEAPON3': '1.100', 'weapon3': '2.392', 'FRAGCOUNT': '5.000', 'DAMAGECOUNT': '5.050'} +[2023-09-14 12:48:43,173][102001] Sum rewards: 8.339, reward structure: {'HEALTH': '-5.000', 'DEATHCOUNT': '-5.000', 'HITCOUNT': '0.000', 'weapon2': '0.006', 'AMMO2': '0.024', 'AMMO5': '0.025', 'AMMO4': '0.119', 'AMMO3': '0.145', 'weapon5': '0.350', 'weapon4': '0.360', 'WEAPON4': '0.400', 'WEAPON5': '0.500', 'WEAPON3': '1.100', 'weapon3': '3.110', 'FRAGCOUNT': '6.000', 'DAMAGECOUNT': '6.200'} +[2023-09-14 12:48:43,765][102001] DAMAGECOUNT value on done: 791.0 +[2023-09-14 12:48:43,765][102001] DAMAGECOUNT value on done: 830.0 +[2023-09-14 12:48:43,766][102001] Sum rewards: 2.271, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.025', 'AMMO3': '0.040', 'AMMO4': '0.125', 'weapon2': '0.164', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.318', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.500', 'weapon4': '0.894', 'weapon3': '1.396'} +[2023-09-14 12:48:44,577][109198] Fps is (10 sec: 13516.9, 60 sec: 14267.7, 300 sec: 13739.6). Total num frames: 14000128. Throughput: 0: 1863.3, 1: 1710.0. Samples: 976140. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:48:44,579][109198] Avg episode reward: [(0, '4.927'), (1, '3.921')] +[2023-09-14 12:48:44,580][101802] Saving new best policy, reward=3.921! +[2023-09-14 12:48:45,149][101964] Updated weights for policy 1, policy_version 1297 (0.0012) +[2023-09-14 12:48:45,728][101965] Updated weights for policy 0, policy_version 2125 (0.0013) +[2023-09-14 12:48:46,935][102004] DAMAGECOUNT value on done: 1834.0 +[2023-09-14 12:48:46,936][102004] Sum rewards: 7.291, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.001', 'AMMO4': '0.004', 'AMMO5': '0.014', 'AMMO3': '0.056', 'weapon4': '0.082', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'weapon2': '0.450', 'WEAPON3': '0.500', 'weapon5': '1.584', 'weapon3': '1.850', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '4.350'} +[2023-09-14 12:48:46,936][102004] DAMAGECOUNT value on done: 2436.0 +[2023-09-14 12:48:46,937][102004] Sum rewards: 1.701, reward structure: {'HEALTH': '-3.450', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.007', 'AMMO5': '0.015', 'AMMO4': '0.033', 'WEAPON4': '0.100', 'AMMO3': '0.116', 'weapon4': '0.176', 'WEAPON5': '0.300', 'weapon2': '0.350', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon5': '1.724', 'DAMAGECOUNT': '1.750', 'weapon3': '1.780'} +[2023-09-14 12:48:47,506][102004] DAMAGECOUNT value on done: 1655.0 +[2023-09-14 12:48:47,506][102004] DAMAGECOUNT value on done: 1625.0 +[2023-09-14 12:48:47,507][102004] Sum rewards: 6.682, reward structure: {'HEALTH': '-3.900', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.020', 'weapon5': '0.036', 'AMMO3': '0.084', 'AMMO4': '0.100', 'WEAPON4': '0.200', 'weapon4': '0.212', 'weapon2': '0.228', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'weapon3': '3.332', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.150'} +[2023-09-14 12:48:47,507][102004] Sum rewards: 5.145, reward structure: {'DEATHCOUNT': '-4.000', 'HEALTH': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.025', 'weapon5': '0.030', 'AMMO2': '0.034', 'AMMO3': '0.128', 'AMMO4': '0.170', 'weapon4': '0.250', 'WEAPON4': '0.300', 'WEAPON5': '0.500', 'weapon2': '0.500', 'WEAPON3': '1.000', 'FRAGCOUNT': '3.000', 'weapon3': '3.058', 'DAMAGECOUNT': '4.150'} +[2023-09-14 12:48:49,577][109198] Fps is (10 sec: 14336.0, 60 sec: 14267.7, 300 sec: 13742.8). Total num frames: 14069760. Throughput: 0: 1866.2, 1: 1712.1. Samples: 987145. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:48:49,579][109198] Avg episode reward: [(0, '4.885'), (1, '3.921')] +[2023-09-14 12:48:51,140][101964] Updated weights for policy 1, policy_version 1307 (0.0015) +[2023-09-14 12:48:51,263][101965] Updated weights for policy 0, policy_version 2135 (0.0014) +[2023-09-14 12:48:54,578][109198] Fps is (10 sec: 14334.4, 60 sec: 14267.5, 300 sec: 13759.7). Total num frames: 14143488. Throughput: 0: 1854.7, 1: 1703.2. Samples: 1007653. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:48:54,581][109198] Avg episode reward: [(0, '4.885'), (1, '3.921')] +[2023-09-14 12:48:56,724][101965] Updated weights for policy 0, policy_version 2145 (0.0012) +[2023-09-14 12:48:57,024][101964] Updated weights for policy 1, policy_version 1317 (0.0011) +[2023-09-14 12:48:59,577][109198] Fps is (10 sec: 14745.6, 60 sec: 14267.7, 300 sec: 14009.7). Total num frames: 14217216. Throughput: 0: 1856.2, 1: 1703.1. Samples: 1029571. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:48:59,579][109198] Avg episode reward: [(0, '4.885'), (1, '3.921')] +[2023-09-14 12:48:59,795][102037] DAMAGECOUNT value on done: 1981.0 +[2023-09-14 12:48:59,795][102037] DAMAGECOUNT value on done: 1670.0 +[2023-09-14 12:48:59,796][102037] Sum rewards: 3.945, reward structure: {'HEALTH': '-3.600', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'weapon2': '0.034', 'AMMO2': '0.034', 'AMMO3': '0.110', 'AMMO4': '0.172', 'WEAPON4': '0.300', 'WEAPON5': '0.400', 'weapon4': '0.718', 'WEAPON3': '0.800', 'weapon5': '0.916', 'FRAGCOUNT': '2.000', 'weapon3': '2.240', 'DAMAGECOUNT': '2.800'} +[2023-09-14 12:48:59,796][102037] Sum rewards: 6.957, reward structure: {'HEALTH': '-2.800', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.015', 'AMMO3': '0.060', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon5': '0.394', 'weapon4': '0.464', 'weapon2': '0.534', 'WEAPON3': '0.600', 'weapon3': '2.490', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.700'} +[2023-09-14 12:49:00,310][102037] DAMAGECOUNT value on done: 1072.0 +[2023-09-14 12:49:00,310][102037] DAMAGECOUNT value on done: 1015.0 +[2023-09-14 12:49:00,312][102037] Sum rewards: 3.647, reward structure: {'HEALTH': '-1.060', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.025', 'AMMO2': '0.030', 'WEAPON5': '0.100', 'AMMO4': '0.149', 'WEAPON4': '0.200', 'WEAPON3': '0.200', 'weapon2': '0.368', 'weapon3': '0.572', 'weapon5': '0.852', 'weapon4': '0.908', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.300'} +[2023-09-14 12:49:00,312][102037] Sum rewards: 4.429, reward structure: {'HEALTH': '-1.300', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.304', 'weapon2': '0.362', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon5': '1.538', 'weapon3': '1.726'} +[2023-09-14 12:49:00,744][102037] DAMAGECOUNT value on done: 2005.0 +[2023-09-14 12:49:00,745][102037] Sum rewards: 3.627, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.018', 'weapon4': '0.038', 'AMMO3': '0.072', 'AMMO4': '0.092', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon2': '0.730', 'FRAGCOUNT': '1.000', 'weapon5': '1.396', 'DAMAGECOUNT': '1.450', 'weapon3': '1.816'} +[2023-09-14 12:49:00,745][102037] DAMAGECOUNT value on done: 1965.0 +[2023-09-14 12:49:00,746][102037] Sum rewards: 6.598, reward structure: {'HEALTH': '-1.450', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.010', 'AMMO4': '0.025', 'AMMO3': '0.040', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.504', 'weapon5': '1.700', 'weapon3': '1.814', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.150'} +[2023-09-14 12:49:01,322][102037] DAMAGECOUNT value on done: 1195.0 +[2023-09-14 12:49:01,322][102037] DAMAGECOUNT value on done: 1009.0 +[2023-09-14 12:49:01,322][102037] Sum rewards: 6.580, reward structure: {'HEALTH': '-1.900', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.422', 'weapon3': '1.490', 'FRAGCOUNT': '1.999', 'weapon5': '2.070', 'DAMAGECOUNT': '2.650'} +[2023-09-14 12:49:01,323][102037] Sum rewards: 0.042, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.046', 'AMMO3': '0.095', 'weapon2': '0.100', 'WEAPON5': '0.200', 'AMMO4': '0.232', 'WEAPON4': '0.400', 'weapon5': '0.430', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.100', 'weapon4': '1.102', 'weapon3': '1.628'} +[2023-09-14 12:49:01,548][102005] DAMAGECOUNT value on done: 788.0 +[2023-09-14 12:49:01,548][102005] DAMAGECOUNT value on done: 780.0 +[2023-09-14 12:49:01,549][102005] Sum rewards: 3.195, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.027', 'AMMO3': '0.068', 'AMMO4': '0.135', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon2': '0.376', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon4': '1.062', 'DAMAGECOUNT': '1.100', 'weapon3': '1.120', 'weapon5': '1.296'} +[2023-09-14 12:49:01,549][102005] Sum rewards: 6.673, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.010', 'weapon2': '0.018', 'AMMO4': '0.024', 'AMMO3': '0.040', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.522', 'weapon3': '1.672', 'weapon5': '1.682', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.000'} +[2023-09-14 12:49:02,112][102005] DAMAGECOUNT value on done: 1209.0 +[2023-09-14 12:49:02,112][102005] DAMAGECOUNT value on done: 1779.0 +[2023-09-14 12:49:02,113][102005] Sum rewards: 8.033, reward structure: {'HEALTH': '-0.910', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'AMMO2': '0.020', 'AMMO4': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.412', 'weapon4': '0.486', 'weapon3': '0.584', 'weapon5': '0.708', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.210'} +[2023-09-14 12:49:02,227][101965] Updated weights for policy 0, policy_version 2155 (0.0013) +[2023-09-14 12:49:02,962][101964] Updated weights for policy 1, policy_version 1327 (0.0013) +[2023-09-14 12:49:03,932][102040] DAMAGECOUNT value on done: 980.0 +[2023-09-14 12:49:03,932][102040] DAMAGECOUNT value on done: 1218.0 +[2023-09-14 12:49:04,521][102040] DAMAGECOUNT value on done: 623.0 +[2023-09-14 12:49:04,521][102040] DAMAGECOUNT value on done: 905.0 +[2023-09-14 12:49:04,577][109198] Fps is (10 sec: 14337.5, 60 sec: 14267.7, 300 sec: 14218.0). Total num frames: 14286848. Throughput: 0: 1856.8, 1: 1702.9. Samples: 1040313. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:49:04,579][109198] Avg episode reward: [(0, '4.957'), (1, '3.887')] +[2023-09-14 12:49:04,580][101718] Saving new best policy, reward=4.957! +[2023-09-14 12:49:05,613][102004] DAMAGECOUNT value on done: 1997.0 +[2023-09-14 12:49:05,613][102004] DAMAGECOUNT value on done: 1766.0 +[2023-09-14 12:49:05,613][102004] Sum rewards: 2.160, reward structure: {'HEALTH': '-4.100', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.022', 'AMMO2': '0.040', 'weapon2': '0.114', 'AMMO3': '0.129', 'AMMO4': '0.199', 'weapon5': '0.290', 'WEAPON4': '0.300', 'weapon4': '0.428', 'WEAPON5': '0.500', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.310', 'weapon3': '2.928'} +[2023-09-14 12:49:05,614][102004] Sum rewards: 7.217, reward structure: {'HEALTH': '-2.250', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.008', 'AMMO5': '0.015', 'AMMO4': '0.042', 'AMMO3': '0.060', 'WEAPON4': '0.200', 'weapon4': '0.264', 'WEAPON5': '0.300', 'weapon5': '0.586', 'WEAPON3': '0.600', 'weapon2': '0.748', 'weapon3': '2.294', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.350'} +[2023-09-14 12:49:05,701][102005] DAMAGECOUNT value on done: 1103.0 +[2023-09-14 12:49:05,702][102005] DAMAGECOUNT value on done: 931.0 +[2023-09-14 12:49:05,702][102005] Sum rewards: 7.720, reward structure: {'HEALTH': '-0.790', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.017', 'AMMO3': '0.020', 'AMMO4': '0.082', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.254', 'weapon4': '0.436', 'weapon3': '0.646', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.000', 'weapon5': '2.650'} +[2023-09-14 12:49:06,161][102004] DAMAGECOUNT value on done: 1270.0 +[2023-09-14 12:49:06,162][102004] DAMAGECOUNT value on done: 1193.0 +[2023-09-14 12:49:06,162][102004] Sum rewards: 4.993, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.020', 'AMMO3': '0.040', 'AMMO4': '0.099', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.756', 'weapon5': '0.980', 'FRAGCOUNT': '1.000', 'weapon3': '1.328', 'DAMAGECOUNT': '1.910'} +[2023-09-14 12:49:06,162][102004] Sum rewards: 3.841, reward structure: {'HEALTH': '-1.910', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.030', 'AMMO2': '-0.006', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.436', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.180', 'weapon3': '1.744', 'weapon5': '1.776'} +[2023-09-14 12:49:06,253][102005] DAMAGECOUNT value on done: 2390.0 +[2023-09-14 12:49:06,254][102005] DAMAGECOUNT value on done: 2340.0 +[2023-09-14 12:49:06,254][102005] Sum rewards: 5.302, reward structure: {'HEALTH': '-2.250', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO3': '0.080', 'WEAPON5': '0.300', 'weapon2': '0.360', 'WEAPON3': '0.600', 'weapon5': '1.724', 'weapon3': '1.752', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.750'} +[2023-09-14 12:49:06,254][102005] Sum rewards: 4.734, reward structure: {'HEALTH': '-2.750', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.015', 'weapon4': '0.016', 'AMMO4': '0.023', 'AMMO3': '0.081', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'weapon2': '0.346', 'WEAPON3': '0.600', 'weapon3': '1.694', 'FRAGCOUNT': '2.000', 'weapon5': '2.004', 'DAMAGECOUNT': '2.300'} +[2023-09-14 12:49:07,565][101965] Updated weights for policy 0, policy_version 2165 (0.0013) +[2023-09-14 12:49:08,103][102040] DAMAGECOUNT value on done: 1176.0 +[2023-09-14 12:49:08,104][102040] DAMAGECOUNT value on done: 989.0 +[2023-09-14 12:49:08,686][102040] DAMAGECOUNT value on done: 1880.0 +[2023-09-14 12:49:08,686][102040] DAMAGECOUNT value on done: 1665.0 +[2023-09-14 12:49:08,687][102040] Sum rewards: 8.032, reward structure: {'HEALTH': '-0.450', 'HITCOUNT': '0.000', 'weapon2': '0.002', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO3': '0.019', 'AMMO4': '0.025', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.312', 'weapon3': '0.858', 'DAMAGECOUNT': '2.000', 'FRAGCOUNT': '2.000', 'weapon5': '2.856'} +[2023-09-14 12:49:08,810][101964] Updated weights for policy 1, policy_version 1337 (0.0013) +[2023-09-14 12:49:09,577][109198] Fps is (10 sec: 14335.9, 60 sec: 14336.0, 300 sec: 14273.5). Total num frames: 14360576. Throughput: 0: 1862.0, 1: 1707.8. Samples: 1062247. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:49:09,579][109198] Avg episode reward: [(0, '4.879'), (1, '3.890')] +[2023-09-14 12:49:12,968][101965] Updated weights for policy 0, policy_version 2175 (0.0012) +[2023-09-14 12:49:14,577][109198] Fps is (10 sec: 14336.0, 60 sec: 14267.7, 300 sec: 14287.4). Total num frames: 14430208. Throughput: 0: 1861.8, 1: 1707.5. Samples: 1084120. Policy #0 lag: (min: 0.0, avg: 0.4, max: 2.0) +[2023-09-14 12:49:14,579][109198] Avg episode reward: [(0, '4.879'), (1, '3.890')] +[2023-09-14 12:49:14,616][101964] Updated weights for policy 1, policy_version 1347 (0.0013) +[2023-09-14 12:49:17,074][102039] DAMAGECOUNT value on done: 1020.0 +[2023-09-14 12:49:17,075][102039] DAMAGECOUNT value on done: 850.0 +[2023-09-14 12:49:17,075][102039] Sum rewards: 5.581, reward structure: {'HEALTH': '-0.800', 'AMMO4': '-0.000', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.714', 'weapon3': '0.796', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon5': '2.546'} +[2023-09-14 12:49:17,463][102046] DAMAGECOUNT value on done: 1055.0 +[2023-09-14 12:49:17,463][102046] DAMAGECOUNT value on done: 1010.0 +[2023-09-14 12:49:17,463][102046] Sum rewards: 7.071, reward structure: {'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.034', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.170', 'WEAPON3': '0.200', 'weapon2': '0.240', 'weapon3': '0.612', 'weapon4': '0.662', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.550', 'weapon5': '2.378'} +[2023-09-14 12:49:17,667][102039] DAMAGECOUNT value on done: 1281.0 +[2023-09-14 12:49:17,667][102039] DAMAGECOUNT value on done: 1761.0 +[2023-09-14 12:49:17,667][102039] Sum rewards: 4.706, reward structure: {'HEALTH': '-0.050', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.024', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.196', 'WEAPON3': '0.200', 'weapon2': '0.344', 'weapon3': '0.732', 'weapon5': '0.980', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050'} +[2023-09-14 12:49:18,023][102046] DAMAGECOUNT value on done: 1600.0 +[2023-09-14 12:49:18,023][102046] DAMAGECOUNT value on done: 1109.0 +[2023-09-14 12:49:18,024][102046] Sum rewards: 4.860, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.015', 'AMMO3': '0.042', 'AMMO4': '0.074', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.568', 'weapon4': '0.584', 'FRAGCOUNT': '1.000', 'weapon5': '1.208', 'DAMAGECOUNT': '1.300', 'weapon3': '1.364'} +[2023-09-14 12:49:18,024][102046] Sum rewards: 3.149, reward structure: {'HEALTH': '-1.300', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.025', 'AMMO3': '0.037', 'WEAPON5': '0.100', 'AMMO4': '0.127', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.532', 'weapon4': '0.600', 'weapon5': '0.732', 'weapon3': '0.790', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.000'} +[2023-09-14 12:49:18,458][101965] Updated weights for policy 0, policy_version 2185 (0.0013) +[2023-09-14 12:49:18,606][102003] DAMAGECOUNT value on done: 1625.0 +[2023-09-14 12:49:18,606][102003] DAMAGECOUNT value on done: 1505.0 +[2023-09-14 12:49:18,607][102003] Sum rewards: 5.319, reward structure: {'HEALTH': '-0.900', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'weapon2': '0.006', 'AMMO2': '0.010', 'AMMO3': '0.020', 'AMMO4': '0.050', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.404', 'weapon3': '0.864', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.200', 'weapon5': '2.260'} +[2023-09-14 12:49:19,025][102039] DAMAGECOUNT value on done: 1430.0 +[2023-09-14 12:49:19,025][102039] DAMAGECOUNT value on done: 876.0 +[2023-09-14 12:49:19,026][102039] Sum rewards: 6.750, reward structure: {'HEALTH': '-1.580', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.039', 'WEAPON4': '0.100', 'weapon4': '0.104', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.702', 'weapon3': '1.566', 'weapon5': '1.588', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.650'} +[2023-09-14 12:49:19,026][102039] Sum rewards: 1.468, reward structure: {'HEALTH': '-2.650', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.019', 'weapon5': '0.024', 'AMMO3': '0.061', 'AMMO4': '0.094', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon2': '0.344', 'WEAPON3': '0.500', 'weapon4': '0.772', 'FRAGCOUNT': '1.000', 'weapon3': '1.418', 'DAMAGECOUNT': '1.580'} +[2023-09-14 12:49:19,140][102046] DAMAGECOUNT value on done: 907.0 +[2023-09-14 12:49:19,141][102046] Sum rewards: 3.785, reward structure: {'HEALTH': '-1.740', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.010', 'AMMO4': '0.024', 'AMMO3': '0.030', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.394', 'weapon4': '0.406', 'FRAGCOUNT': '1.000', 'weapon3': '1.154', 'weapon5': '1.352', 'DAMAGECOUNT': '1.450'} +[2023-09-14 12:49:19,141][102046] DAMAGECOUNT value on done: 818.0 +[2023-09-14 12:49:19,141][102046] Sum rewards: 3.286, reward structure: {'HEALTH': '-1.450', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.020', 'AMMO3': '0.048', 'WEAPON5': '0.100', 'AMMO4': '0.101', 'WEAPON4': '0.200', 'weapon5': '0.220', 'WEAPON3': '0.400', 'weapon2': '0.408', 'weapon4': '0.528', 'weapon3': '0.968', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.740'} +[2023-09-14 12:49:19,181][102003] DAMAGECOUNT value on done: 745.0 +[2023-09-14 12:49:19,182][102003] DAMAGECOUNT value on done: 900.0 +[2023-09-14 12:49:19,182][102003] Sum rewards: 5.987, reward structure: {'HEALTH': '-0.590', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.194', 'WEAPON3': '0.200', 'weapon2': '0.344', 'weapon3': '0.728', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon5': '2.806'} +[2023-09-14 12:49:19,577][109198] Fps is (10 sec: 14745.6, 60 sec: 14404.3, 300 sec: 14301.3). Total num frames: 14508032. Throughput: 0: 1865.8, 1: 1715.6. Samples: 1095410. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:49:19,579][109198] Avg episode reward: [(0, '4.875'), (1, '3.837')] +[2023-09-14 12:49:19,681][102039] DAMAGECOUNT value on done: 1071.0 +[2023-09-14 12:49:19,681][102039] DAMAGECOUNT value on done: 1250.0 +[2023-09-14 12:49:19,682][102039] Sum rewards: 3.859, reward structure: {'HEALTH': '-1.700', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.012', 'AMMO3': '0.040', 'AMMO4': '0.058', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.378', 'WEAPON3': '0.400', 'weapon2': '0.796', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '1.254', 'weapon5': '1.264'} +[2023-09-14 12:49:19,682][102039] Sum rewards: 4.847, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.050', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon2': '0.230', 'WEAPON3': '0.400', 'weapon4': '0.562', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.300', 'weapon3': '1.340', 'weapon5': '1.610'} +[2023-09-14 12:49:19,734][102003] DAMAGECOUNT value on done: 1440.0 +[2023-09-14 12:49:19,735][102003] DAMAGECOUNT value on done: 973.0 +[2023-09-14 12:49:19,735][102003] Sum rewards: 8.128, reward structure: {'HEALTH': '-0.330', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.024', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.198', 'WEAPON3': '0.200', 'weapon2': '0.348', 'weapon3': '0.840', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.300', 'weapon5': '2.318'} +[2023-09-14 12:49:19,836][102046] DAMAGECOUNT value on done: 1040.0 +[2023-09-14 12:49:19,836][102046] DAMAGECOUNT value on done: 1445.0 +[2023-09-14 12:49:19,836][102046] Sum rewards: 1.665, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.004', 'FRAGCOUNT': '-0.001', 'AMMO2': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.040', 'weapon4': '0.098', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.150', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.434', 'weapon5': '0.866', 'weapon3': '1.374'} +[2023-09-14 12:49:20,004][102001] DAMAGECOUNT value on done: 1010.0 +[2023-09-14 12:49:20,004][102001] DAMAGECOUNT value on done: 922.0 +[2023-09-14 12:49:20,005][102001] Sum rewards: 2.330, reward structure: {'HEALTH': '-2.500', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.021', 'AMMO3': '0.070', 'AMMO4': '0.105', 'weapon5': '0.224', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon2': '0.332', 'WEAPON3': '0.600', 'weapon4': '0.714', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.350', 'weapon3': '1.798'} +[2023-09-14 12:49:20,005][102001] Sum rewards: 5.463, reward structure: {'HEALTH': '-2.250', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'weapon2': '0.008', 'AMMO5': '0.013', 'AMMO2': '0.015', 'AMMO3': '0.060', 'AMMO4': '0.074', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'WEAPON3': '0.600', 'weapon4': '0.718', 'weapon5': '0.902', 'FRAGCOUNT': '1.999', 'weapon3': '2.224', 'DAMAGECOUNT': '2.500'} +[2023-09-14 12:49:20,340][102003] DAMAGECOUNT value on done: 1360.0 +[2023-09-14 12:49:20,340][102003] DAMAGECOUNT value on done: 1069.0 +[2023-09-14 12:49:20,566][101964] Updated weights for policy 1, policy_version 1357 (0.0013) +[2023-09-14 12:49:20,614][102001] DAMAGECOUNT value on done: 940.0 +[2023-09-14 12:49:20,614][102001] DAMAGECOUNT value on done: 1270.0 +[2023-09-14 12:49:20,615][102001] Sum rewards: 6.323, reward structure: {'HEALTH': '-0.220', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.005', 'weapon2': '0.016', 'AMMO3': '0.020', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.210', 'weapon3': '0.732', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon5': '3.110'} +[2023-09-14 12:49:20,695][102004] DAMAGECOUNT value on done: 2456.0 +[2023-09-14 12:49:20,696][102004] DAMAGECOUNT value on done: 1949.0 +[2023-09-14 12:49:20,696][102004] Sum rewards: 4.023, reward structure: {'HEALTH': '-0.200', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.388', 'weapon5': '0.674', 'weapon3': '0.716', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150'} +[2023-09-14 12:49:21,296][102004] DAMAGECOUNT value on done: 1985.0 +[2023-09-14 12:49:21,296][102004] DAMAGECOUNT value on done: 2045.0 +[2023-09-14 12:49:21,297][102004] Sum rewards: 5.930, reward structure: {'HEALTH': '-4.200', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO2': '0.022', 'AMMO5': '0.025', 'AMMO4': '0.108', 'AMMO3': '0.110', 'weapon2': '0.150', 'WEAPON4': '0.400', 'weapon5': '0.438', 'WEAPON5': '0.500', 'weapon4': '0.564', 'WEAPON3': '0.900', 'weapon3': '2.714', 'FRAGCOUNT': '3.999', 'DAMAGECOUNT': '4.200'} +[2023-09-14 12:49:21,296][102004] Sum rewards: 3.729, reward structure: {'DEATHCOUNT': '-4.000', 'HEALTH': '-4.000', 'HITCOUNT': '0.000', 'AMMO2': '0.016', 'AMMO5': '0.020', 'weapon2': '0.056', 'AMMO4': '0.078', 'AMMO3': '0.110', 'WEAPON4': '0.300', 'WEAPON5': '0.400', 'weapon4': '0.716', 'WEAPON3': '0.800', 'weapon5': '0.916', 'weapon3': '2.016', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.300'} +[2023-09-14 12:49:22,067][102001] DAMAGECOUNT value on done: 2288.0 +[2023-09-14 12:49:22,067][102001] DAMAGECOUNT value on done: 2480.0 +[2023-09-14 12:49:22,068][102001] Sum rewards: 8.040, reward structure: {'HEALTH': '-0.500', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO3': '0.020', 'AMMO4': '0.049', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.300', 'weapon2': '0.346', 'weapon3': '0.802', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050', 'weapon5': '2.558'} +[2023-09-14 12:49:22,584][102001] DAMAGECOUNT value on done: 931.0 +[2023-09-14 12:49:22,584][102001] DAMAGECOUNT value on done: 915.0 +[2023-09-14 12:49:22,585][102001] Sum rewards: 5.861, reward structure: {'HEALTH': '-0.850', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.020', 'AMMO4': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.612', 'weapon3': '0.656', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.400', 'weapon5': '2.498'} +[2023-09-14 12:49:23,739][101965] Updated weights for policy 0, policy_version 2195 (0.0012) +[2023-09-14 12:49:24,577][109198] Fps is (10 sec: 15155.2, 60 sec: 14404.3, 300 sec: 14301.3). Total num frames: 14581760. Throughput: 0: 1869.6, 1: 1722.2. Samples: 1116837. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:49:24,579][109198] Avg episode reward: [(0, '4.778'), (1, '3.744')] +[2023-09-14 12:49:26,263][101964] Updated weights for policy 1, policy_version 1367 (0.0013) +[2023-09-14 12:49:29,389][101965] Updated weights for policy 0, policy_version 2205 (0.0012) +[2023-09-14 12:49:29,577][109198] Fps is (10 sec: 14336.0, 60 sec: 14336.0, 300 sec: 14273.5). Total num frames: 14651392. Throughput: 0: 1877.3, 1: 1733.7. Samples: 1138636. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:49:29,579][109198] Avg episode reward: [(0, '4.778'), (1, '3.744')] +[2023-09-14 12:49:32,216][101964] Updated weights for policy 1, policy_version 1377 (0.0011) +[2023-09-14 12:49:34,577][109198] Fps is (10 sec: 14335.9, 60 sec: 14336.0, 300 sec: 14287.4). Total num frames: 14725120. Throughput: 0: 1875.8, 1: 1733.6. Samples: 1149570. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:49:34,579][109198] Avg episode reward: [(0, '4.778'), (1, '3.744')] +[2023-09-14 12:49:34,697][101965] Updated weights for policy 0, policy_version 2215 (0.0014) +[2023-09-14 12:49:36,704][102037] DAMAGECOUNT value on done: 2491.0 +[2023-09-14 12:49:36,704][102037] DAMAGECOUNT value on done: 2085.0 +[2023-09-14 12:49:36,705][102037] Sum rewards: 8.156, reward structure: {'HEALTH': '-4.000', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.025', 'AMMO2': '0.025', 'AMMO4': '0.126', 'AMMO3': '0.136', 'WEAPON4': '0.400', 'weapon4': '0.414', 'weapon2': '0.464', 'WEAPON5': '0.500', 'weapon5': '0.514', 'WEAPON3': '1.000', 'weapon3': '2.452', 'FRAGCOUNT': '5.000', 'DAMAGECOUNT': '5.100'} +[2023-09-14 12:49:36,705][102037] Sum rewards: 4.449, reward structure: {'HEALTH': '-5.000', 'DEATHCOUNT': '-5.000', 'HITCOUNT': '0.000', 'AMMO5': '0.025', 'weapon2': '0.034', 'AMMO2': '0.038', 'AMMO3': '0.135', 'weapon5': '0.154', 'AMMO4': '0.187', 'WEAPON5': '0.500', 'WEAPON4': '0.600', 'WEAPON3': '1.000', 'weapon4': '1.174', 'weapon3': '2.452', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.150'} +[2023-09-14 12:49:37,253][102037] DAMAGECOUNT value on done: 1092.0 +[2023-09-14 12:49:37,254][102037] DAMAGECOUNT value on done: 1075.0 +[2023-09-14 12:49:37,254][102037] Sum rewards: 2.945, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO2': '0.007', 'AMMO5': '0.010', 'AMMO4': '0.034', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.600', 'weapon2': '0.920', 'weapon5': '1.166', 'weapon3': '1.570'} +[2023-09-14 12:49:37,620][102037] DAMAGECOUNT value on done: 2300.0 +[2023-09-14 12:49:37,620][102037] DAMAGECOUNT value on done: 2405.0 +[2023-09-14 12:49:37,621][102037] Sum rewards: 4.072, reward structure: {'HEALTH': '-4.000', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO2': '0.015', 'AMMO5': '0.020', 'weapon5': '0.058', 'AMMO4': '0.074', 'AMMO3': '0.126', 'WEAPON4': '0.200', 'weapon4': '0.208', 'WEAPON5': '0.400', 'weapon2': '0.488', 'WEAPON3': '1.000', 'FRAGCOUNT': '3.000', 'weapon3': '3.132', 'DAMAGECOUNT': '3.350'} +[2023-09-14 12:49:37,621][102037] Sum rewards: 7.221, reward structure: {'HEALTH': '-3.300', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'weapon2': '0.004', 'AMMO2': '0.015', 'AMMO5': '0.020', 'AMMO4': '0.074', 'AMMO3': '0.085', 'WEAPON4': '0.200', 'WEAPON5': '0.400', 'weapon5': '0.470', 'weapon4': '0.536', 'WEAPON3': '0.800', 'weapon3': '2.916', 'DAMAGECOUNT': '4.000', 'FRAGCOUNT': '4.000'} +[2023-09-14 12:49:37,765][102005] DAMAGECOUNT value on done: 885.0 +[2023-09-14 12:49:37,765][102005] DAMAGECOUNT value on done: 928.0 +[2023-09-14 12:49:37,765][102005] Sum rewards: 4.472, reward structure: {'HEALTH': '-1.400', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'weapon2': '0.002', 'AMMO5': '0.010', 'AMMO3': '0.046', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.212', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '1.346', 'weapon5': '2.506'} +[2023-09-14 12:49:37,766][102005] Sum rewards: 5.104, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.020', 'AMMO3': '0.040', 'AMMO4': '0.100', 'weapon2': '0.188', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.776', 'FRAGCOUNT': '1.000', 'weapon3': '1.326', 'DAMAGECOUNT': '1.400', 'weapon5': '1.446'} +[2023-09-14 12:49:38,130][102037] DAMAGECOUNT value on done: 1300.0 +[2023-09-14 12:49:38,130][102037] DAMAGECOUNT value on done: 1274.0 +[2023-09-14 12:49:38,131][102037] Sum rewards: 2.594, reward structure: {'HEALTH': '-2.600', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.018', 'AMMO3': '0.074', 'AMMO4': '0.091', 'weapon2': '0.130', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'WEAPON3': '0.600', 'weapon4': '0.644', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon5': '1.514', 'weapon3': '1.562'} +[2023-09-14 12:49:38,131][102037] Sum rewards: 6.047, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.015', 'AMMO3': '0.042', 'AMMO4': '0.074', 'weapon2': '0.128', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.250', 'WEAPON3': '0.400', 'weapon4': '0.706', 'weapon3': '1.372', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.650'} +[2023-09-14 12:49:38,225][101964] Updated weights for policy 1, policy_version 1387 (0.0012) +[2023-09-14 12:49:38,420][102005] DAMAGECOUNT value on done: 1459.0 +[2023-09-14 12:49:38,421][102005] DAMAGECOUNT value on done: 1869.0 +[2023-09-14 12:49:38,421][102005] Sum rewards: 4.193, reward structure: {'HEALTH': '-1.300', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.011', 'AMMO3': '0.036', 'AMMO4': '0.055', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon4': '0.310', 'weapon2': '0.354', 'weapon5': '0.778', 'weapon3': '0.844', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '2.500'} +[2023-09-14 12:49:39,577][109198] Fps is (10 sec: 14336.0, 60 sec: 14472.5, 300 sec: 14273.5). Total num frames: 14794752. Throughput: 0: 1881.0, 1: 1740.4. Samples: 1170616. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:49:39,579][109198] Avg episode reward: [(0, '4.739'), (1, '3.784')] +[2023-09-14 12:49:40,324][101965] Updated weights for policy 0, policy_version 2225 (0.0015) +[2023-09-14 12:49:40,596][102040] DAMAGECOUNT value on done: 1040.0 +[2023-09-14 12:49:40,596][102040] DAMAGECOUNT value on done: 1288.0 +[2023-09-14 12:49:41,141][102040] DAMAGECOUNT value on done: 905.0 +[2023-09-14 12:49:41,141][102040] DAMAGECOUNT value on done: 628.0 +[2023-09-14 12:49:42,241][102005] DAMAGECOUNT value on done: 1223.0 +[2023-09-14 12:49:42,241][102005] DAMAGECOUNT value on done: 1123.0 +[2023-09-14 12:49:42,242][102005] Sum rewards: 4.543, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.017', 'AMMO3': '0.045', 'AMMO4': '0.085', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon2': '0.398', 'WEAPON3': '0.400', 'weapon5': '0.556', 'weapon4': '0.624', 'FRAGCOUNT': '1.000', 'weapon3': '1.342', 'DAMAGECOUNT': '1.920'} +[2023-09-14 12:49:42,241][102005] Sum rewards: 2.580, reward structure: {'HEALTH': '-2.420', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.026', 'AMMO3': '0.042', 'AMMO4': '0.127', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'WEAPON3': '0.400', 'weapon5': '0.544', 'weapon4': '0.632', 'FRAGCOUNT': '0.999', 'weapon2': '1.066', 'DAMAGECOUNT': '1.200', 'weapon3': '1.456'} +[2023-09-14 12:49:42,816][102004] DAMAGECOUNT value on done: 2067.0 +[2023-09-14 12:49:42,816][102004] DAMAGECOUNT value on done: 1861.0 +[2023-09-14 12:49:42,849][102005] DAMAGECOUNT value on done: 2810.0 +[2023-09-14 12:49:42,850][102005] DAMAGECOUNT value on done: 2850.0 +[2023-09-14 12:49:42,850][102005] Sum rewards: 4.323, reward structure: {'HEALTH': '-5.000', 'DEATHCOUNT': '-5.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.037', 'weapon5': '0.122', 'AMMO3': '0.131', 'AMMO4': '0.186', 'weapon2': '0.232', 'WEAPON5': '0.400', 'WEAPON4': '0.400', 'weapon4': '0.860', 'WEAPON3': '1.000', 'weapon3': '2.734', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.200'} +[2023-09-14 12:49:42,851][102005] Sum rewards: 8.038, reward structure: {'DEATHCOUNT': '-4.000', 'HEALTH': '-4.000', 'HITCOUNT': '0.000', 'AMMO2': '0.008', 'AMMO5': '0.025', 'AMMO4': '0.038', 'AMMO3': '0.135', 'WEAPON4': '0.300', 'weapon2': '0.354', 'weapon4': '0.364', 'WEAPON5': '0.500', 'weapon5': '0.686', 'WEAPON3': '1.000', 'weapon3': '2.528', 'FRAGCOUNT': '5.000', 'DAMAGECOUNT': '5.100'} +[2023-09-14 12:49:43,418][102004] DAMAGECOUNT value on done: 1506.0 +[2023-09-14 12:49:43,418][102004] DAMAGECOUNT value on done: 1583.0 +[2023-09-14 12:49:43,419][102004] Sum rewards: 1.540, reward structure: {'HEALTH': '-3.800', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.027', 'AMMO3': '0.072', 'WEAPON5': '0.100', 'AMMO4': '0.136', 'WEAPON4': '0.300', 'weapon2': '0.376', 'WEAPON3': '0.600', 'weapon5': '0.784', 'weapon4': '0.838', 'FRAGCOUNT': '1.000', 'weapon3': '1.742', 'DAMAGECOUNT': '2.360'} +[2023-09-14 12:49:43,419][102004] Sum rewards: 5.990, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'AMMO4': '-0.015', 'AMMO2': '-0.003', 'HITCOUNT': '0.000', 'AMMO5': '0.011', 'AMMO3': '0.080', 'WEAPON4': '0.100', 'weapon4': '0.210', 'weapon2': '0.256', 'WEAPON5': '0.300', 'WEAPON3': '0.700', 'weapon5': '1.166', 'weapon3': '2.286', 'FRAGCOUNT': '2.998', 'DAMAGECOUNT': '3.900'} +[2023-09-14 12:49:44,371][101964] Updated weights for policy 1, policy_version 1397 (0.0012) +[2023-09-14 12:49:44,577][109198] Fps is (10 sec: 13926.5, 60 sec: 14404.3, 300 sec: 14273.5). Total num frames: 14864384. Throughput: 0: 1873.5, 1: 1731.0. Samples: 1191772. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:49:44,579][109198] Avg episode reward: [(0, '4.795'), (1, '3.736')] +[2023-09-14 12:49:45,059][102040] DAMAGECOUNT value on done: 1321.0 +[2023-09-14 12:49:45,059][102040] DAMAGECOUNT value on done: 1094.0 +[2023-09-14 12:49:45,060][102040] Sum rewards: 3.823, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO4': '0.024', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'weapon4': '0.242', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon2': '1.074', 'DAMAGECOUNT': '1.450', 'weapon3': '1.488'} +[2023-09-14 12:49:45,060][102040] Sum rewards: 4.150, reward structure: {'HEALTH': '-1.450', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.030', 'AMMO3': '0.050', 'AMMO4': '0.150', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.322', 'WEAPON3': '0.400', 'weapon4': '0.764', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '1.140', 'weapon5': '1.284'} +[2023-09-14 12:49:45,681][102040] DAMAGECOUNT value on done: 2190.0 +[2023-09-14 12:49:45,681][102040] DAMAGECOUNT value on done: 2125.0 +[2023-09-14 12:49:45,682][102040] Sum rewards: 3.598, reward structure: {'HEALTH': '-4.450', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO2': '0.024', 'AMMO5': '0.025', 'weapon2': '0.034', 'AMMO4': '0.122', 'AMMO3': '0.142', 'WEAPON4': '0.300', 'WEAPON5': '0.500', 'weapon4': '0.554', 'weapon5': '0.980', 'WEAPON3': '1.000', 'weapon3': '2.266', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.100'} +[2023-09-14 12:49:45,682][102040] Sum rewards: 8.043, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.017', 'AMMO5': '0.020', 'AMMO4': '0.085', 'AMMO3': '0.098', 'WEAPON4': '0.200', 'weapon2': '0.238', 'WEAPON5': '0.400', 'weapon4': '0.428', 'weapon5': '0.790', 'WEAPON3': '0.800', 'weapon3': '2.366', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.600'} +[2023-09-14 12:49:46,077][101965] Updated weights for policy 0, policy_version 2235 (0.0013) +[2023-09-14 12:49:49,577][109198] Fps is (10 sec: 13926.4, 60 sec: 14404.2, 300 sec: 14259.6). Total num frames: 14934016. Throughput: 0: 1868.8, 1: 1727.1. Samples: 1202129. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:49:49,579][109198] Avg episode reward: [(0, '4.842'), (1, '3.736')] +[2023-09-14 12:49:49,586][101718] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002241_9179136.pth... +[2023-09-14 12:49:49,586][101802] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001405_5754880.pth... +[2023-09-14 12:49:49,647][101718] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001806_7397376.pth +[2023-09-14 12:49:49,648][101802] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001005_4116480.pth +[2023-09-14 12:49:50,541][101964] Updated weights for policy 1, policy_version 1407 (0.0012) +[2023-09-14 12:49:51,649][101965] Updated weights for policy 0, policy_version 2245 (0.0012) +[2023-09-14 12:49:54,577][109198] Fps is (10 sec: 14336.0, 60 sec: 14404.5, 300 sec: 14273.5). Total num frames: 15007744. Throughput: 0: 1863.1, 1: 1724.4. Samples: 1223685. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:49:54,579][109198] Avg episode reward: [(0, '4.842'), (1, '3.736')] +[2023-09-14 12:49:55,351][102004] DAMAGECOUNT value on done: 2701.0 +[2023-09-14 12:49:55,351][102004] DAMAGECOUNT value on done: 2224.0 +[2023-09-14 12:49:55,352][102004] Sum rewards: 2.759, reward structure: {'HEALTH': '-3.750', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.015', 'AMMO5': '0.020', 'AMMO4': '0.074', 'AMMO3': '0.102', 'WEAPON4': '0.300', 'WEAPON5': '0.400', 'weapon2': '0.406', 'weapon4': '0.446', 'weapon5': '0.458', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.999', 'weapon3': '2.038', 'DAMAGECOUNT': '2.450'} +[2023-09-14 12:49:55,352][102004] Sum rewards: 5.780, reward structure: {'HEALTH': '-2.350', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.022', 'AMMO3': '0.062', 'AMMO4': '0.107', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon2': '0.328', 'weapon4': '0.496', 'WEAPON3': '0.600', 'weapon5': '0.980', 'FRAGCOUNT': '2.000', 'weapon3': '2.170', 'DAMAGECOUNT': '2.750'} +[2023-09-14 12:49:55,430][102039] DAMAGECOUNT value on done: 850.0 +[2023-09-14 12:49:55,431][102039] DAMAGECOUNT value on done: 1145.0 +[2023-09-14 12:49:55,431][102039] Sum rewards: 3.705, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'weapon4': '0.164', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.502', 'weapon5': '0.662', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.250', 'weapon3': '1.410'} +[2023-09-14 12:49:55,909][102004] DAMAGECOUNT value on done: 2510.0 +[2023-09-14 12:49:55,909][102004] DAMAGECOUNT value on done: 2350.0 +[2023-09-14 12:49:55,910][102004] Sum rewards: 9.681, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.017', 'AMMO5': '0.020', 'AMMO3': '0.081', 'AMMO4': '0.085', 'WEAPON4': '0.300', 'weapon2': '0.362', 'WEAPON5': '0.400', 'weapon4': '0.400', 'WEAPON3': '0.700', 'weapon5': '0.782', 'weapon3': '2.284', 'FRAGCOUNT': '5.000', 'DAMAGECOUNT': '5.250'} +[2023-09-14 12:49:55,910][102004] Sum rewards: 2.378, reward structure: {'HEALTH': '-5.050', 'DEATHCOUNT': '-5.000', 'HITCOUNT': '0.000', 'AMMO5': '0.025', 'AMMO2': '0.058', 'AMMO3': '0.130', 'weapon2': '0.260', 'AMMO4': '0.289', 'weapon4': '0.444', 'WEAPON4': '0.500', 'WEAPON5': '0.500', 'weapon5': '0.644', 'WEAPON3': '1.000', 'weapon3': '2.528', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.050'} +[2023-09-14 12:49:56,042][102039] DAMAGECOUNT value on done: 1506.0 +[2023-09-14 12:49:56,042][102039] DAMAGECOUNT value on done: 1901.0 +[2023-09-14 12:49:56,043][102039] Sum rewards: 6.525, reward structure: {'HEALTH': '-1.400', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.025', 'AMMO3': '0.040', 'AMMO4': '0.124', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.296', 'WEAPON3': '0.400', 'weapon4': '0.868', 'weapon5': '1.130', 'weapon3': '1.382', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.250'} +[2023-09-14 12:49:56,043][102039] Sum rewards: 3.256, reward structure: {'HEALTH': '-2.250', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.011', 'AMMO5': '0.015', 'AMMO4': '0.056', 'AMMO3': '0.058', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'WEAPON3': '0.500', 'weapon4': '0.600', 'weapon5': '0.654', 'weapon2': '0.892', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.400', 'weapon3': '1.720'} +[2023-09-14 12:49:56,098][102046] DAMAGECOUNT value on done: 1105.0 +[2023-09-14 12:49:56,099][102046] DAMAGECOUNT value on done: 1260.0 +[2023-09-14 12:49:56,099][102046] Sum rewards: 5.089, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.042', 'AMMO2': '-0.008', 'HITCOUNT': '0.000', 'AMMO5': '0.013', 'AMMO3': '0.060', 'WEAPON4': '0.100', 'weapon4': '0.166', 'WEAPON5': '0.300', 'weapon5': '0.500', 'WEAPON3': '0.600', 'weapon2': '0.740', 'FRAGCOUNT': '1.998', 'weapon3': '2.162', 'DAMAGECOUNT': '2.500'} +[2023-09-14 12:49:56,395][101964] Updated weights for policy 1, policy_version 1417 (0.0012) +[2023-09-14 12:49:56,677][102046] DAMAGECOUNT value on done: 1373.0 +[2023-09-14 12:49:56,677][102046] DAMAGECOUNT value on done: 1830.0 +[2023-09-14 12:49:56,678][102046] Sum rewards: 5.055, reward structure: {'HEALTH': '-2.250', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.012', 'AMMO5': '0.015', 'AMMO4': '0.059', 'AMMO3': '0.068', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon5': '0.466', 'weapon2': '0.490', 'WEAPON3': '0.600', 'weapon4': '0.670', 'weapon3': '1.784', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.640'} +[2023-09-14 12:49:56,678][102046] Sum rewards: 4.563, reward structure: {'HEALTH': '-2.610', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO2': '0.024', 'AMMO3': '0.066', 'AMMO4': '0.119', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon2': '0.338', 'weapon5': '0.594', 'WEAPON3': '0.600', 'weapon4': '0.676', 'weapon3': '1.842', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.300'} +[2023-09-14 12:49:56,745][102003] DAMAGECOUNT value on done: 1845.0 +[2023-09-14 12:49:56,745][102003] DAMAGECOUNT value on done: 2030.0 +[2023-09-14 12:49:56,745][102003] Sum rewards: 3.697, reward structure: {'HEALTH': '-4.000', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO2': '0.001', 'AMMO4': '0.005', 'AMMO5': '0.020', 'AMMO3': '0.098', 'WEAPON4': '0.200', 'WEAPON5': '0.400', 'weapon5': '0.410', 'weapon4': '0.466', 'weapon2': '0.788', 'WEAPON3': '0.800', 'weapon3': '2.108', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.400'} +[2023-09-14 12:49:56,746][102003] Sum rewards: 7.576, reward structure: {'HEALTH': '-3.250', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'weapon2': '0.004', 'AMMO5': '0.020', 'AMMO2': '0.027', 'AMMO3': '0.093', 'AMMO4': '0.132', 'WEAPON4': '0.400', 'WEAPON5': '0.400', 'weapon4': '0.522', 'WEAPON3': '0.800', 'weapon5': '0.814', 'weapon3': '2.564', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.050'} +[2023-09-14 12:49:57,122][101965] Updated weights for policy 0, policy_version 2255 (0.0013) +[2023-09-14 12:49:57,173][102039] DAMAGECOUNT value on done: 1600.0 +[2023-09-14 12:49:57,174][102039] DAMAGECOUNT value on done: 993.0 +[2023-09-14 12:49:57,174][102039] Sum rewards: 5.361, reward structure: {'HEALTH': '-1.120', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.230', 'WEAPON3': '0.400', 'weapon2': '0.642', 'FRAGCOUNT': '1.000', 'weapon3': '1.432', 'DAMAGECOUNT': '1.700', 'weapon5': '1.728'} +[2023-09-14 12:49:57,175][102039] Sum rewards: 1.976, reward structure: {'HEALTH': '-1.650', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.004', 'AMMO4': '0.022', 'AMMO3': '0.049', 'weapon2': '0.056', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.312', 'weapon5': '0.312', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon3': '1.098', 'DAMAGECOUNT': '1.170'} +[2023-09-14 12:49:57,338][102003] DAMAGECOUNT value on done: 1165.0 +[2023-09-14 12:49:57,339][102003] DAMAGECOUNT value on done: 1110.0 +[2023-09-14 12:49:57,339][102003] Sum rewards: 9.257, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.002', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO3': '0.060', 'WEAPON4': '0.100', 'weapon4': '0.206', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon2': '0.762', 'weapon5': '0.820', 'weapon3': '2.196', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.200'} +[2023-09-14 12:49:57,340][102003] Sum rewards: 1.402, reward structure: {'HEALTH': '-4.000', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.023', 'AMMO4': '0.115', 'AMMO3': '0.125', 'weapon5': '0.132', 'WEAPON5': '0.200', 'WEAPON4': '0.400', 'weapon2': '0.630', 'weapon4': '0.876', 'WEAPON3': '0.900', 'weapon3': '1.890', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.100'} +[2023-09-14 12:49:57,762][102039] DAMAGECOUNT value on done: 1096.0 +[2023-09-14 12:49:57,763][102039] DAMAGECOUNT value on done: 1325.0 +[2023-09-14 12:49:57,916][102003] DAMAGECOUNT value on done: 1148.0 +[2023-09-14 12:49:57,917][102003] Sum rewards: 4.786, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.029', 'AMMO3': '0.045', 'WEAPON5': '0.100', 'AMMO4': '0.143', 'weapon2': '0.146', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon5': '0.700', 'weapon4': '0.830', 'FRAGCOUNT': '1.000', 'weapon3': '1.438', 'DAMAGECOUNT': '1.750'} +[2023-09-14 12:49:57,917][102003] DAMAGECOUNT value on done: 1540.0 +[2023-09-14 12:49:57,918][102003] Sum rewards: 3.845, reward structure: {'HEALTH': '-1.700', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.016', 'weapon2': '0.038', 'AMMO3': '0.039', 'AMMO4': '0.077', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon4': '0.496', 'weapon3': '0.882', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon5': '2.392'} +[2023-09-14 12:49:57,965][102046] DAMAGECOUNT value on done: 1007.0 +[2023-09-14 12:49:57,965][102046] DAMAGECOUNT value on done: 921.0 +[2023-09-14 12:49:57,966][102046] Sum rewards: 4.426, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.007', 'AMMO4': '0.033', 'AMMO3': '0.047', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon2': '0.278', 'WEAPON3': '0.400', 'weapon4': '0.406', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.212', 'weapon5': '1.838'} +[2023-09-14 12:49:57,966][102046] Sum rewards: 2.686, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.015', 'AMMO3': '0.030', 'AMMO4': '0.075', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.376', 'weapon4': '0.602', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.030', 'weapon3': '1.058'} +[2023-09-14 12:49:58,493][102003] DAMAGECOUNT value on done: 1470.0 +[2023-09-14 12:49:58,494][102003] DAMAGECOUNT value on done: 1211.0 +[2023-09-14 12:49:58,494][102003] Sum rewards: 4.061, reward structure: {'HEALTH': '-1.320', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.011', 'weapon2': '0.018', 'AMMO3': '0.052', 'AMMO4': '0.054', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.406', 'FRAGCOUNT': '1.000', 'weapon3': '1.038', 'DAMAGECOUNT': '1.100', 'weapon5': '1.892'} +[2023-09-14 12:49:58,495][102003] Sum rewards: 3.235, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.004', 'AMMO2': '0.033', 'AMMO3': '0.054', 'WEAPON5': '0.100', 'AMMO4': '0.163', 'weapon2': '0.282', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'weapon5': '0.896', 'weapon4': '0.916', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.420', 'weapon3': '1.568'} +[2023-09-14 12:49:58,731][102046] DAMAGECOUNT value on done: 1115.0 +[2023-09-14 12:49:58,731][102046] DAMAGECOUNT value on done: 1565.0 +[2023-09-14 12:49:58,732][102046] Sum rewards: 4.753, reward structure: {'HEALTH': '-0.750', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'AMMO2': '0.026', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.132', 'WEAPON3': '0.200', 'weapon2': '0.200', 'weapon3': '0.626', 'weapon4': '0.662', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.200', 'weapon5': '1.234'} +[2023-09-14 12:49:59,355][102001] DAMAGECOUNT value on done: 1010.0 +[2023-09-14 12:49:59,356][102001] DAMAGECOUNT value on done: 942.0 +[2023-09-14 12:49:59,577][109198] Fps is (10 sec: 13926.4, 60 sec: 14267.7, 300 sec: 14259.6). Total num frames: 15073280. Throughput: 0: 1841.9, 1: 1725.2. Samples: 1244639. Policy #0 lag: (min: 0.0, avg: 0.4, max: 2.0) +[2023-09-14 12:49:59,579][109198] Avg episode reward: [(0, '4.852'), (1, '3.569')] +[2023-09-14 12:49:59,892][102001] DAMAGECOUNT value on done: 1450.0 +[2023-09-14 12:49:59,892][102001] DAMAGECOUNT value on done: 1182.0 +[2023-09-14 12:49:59,892][102001] Sum rewards: 4.326, reward structure: {'HEALTH': '-2.350', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.017', 'AMMO3': '0.068', 'AMMO4': '0.084', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon2': '0.588', 'weapon5': '0.596', 'WEAPON3': '0.600', 'weapon4': '0.600', 'DAMAGECOUNT': '1.800', 'weapon3': '1.808', 'FRAGCOUNT': '2.000'} +[2023-09-14 12:49:59,893][102001] Sum rewards: 5.469, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.006', 'AMMO5': '0.015', 'AMMO4': '0.027', 'AMMO3': '0.060', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon2': '0.376', 'weapon4': '0.410', 'WEAPON3': '0.600', 'weapon5': '0.882', 'FRAGCOUNT': '2.000', 'weapon3': '2.174', 'DAMAGECOUNT': '2.420'} +[2023-09-14 12:50:01,305][102001] DAMAGECOUNT value on done: 2698.0 +[2023-09-14 12:50:01,305][102001] DAMAGECOUNT value on done: 3320.0 +[2023-09-14 12:50:01,306][102001] Sum rewards: -0.658, reward structure: {'HEALTH': '-8.100', 'DEATHCOUNT': '-8.000', 'HITCOUNT': '0.000', 'weapon2': '0.034', 'AMMO2': '0.039', 'AMMO5': '0.040', 'AMMO4': '0.193', 'AMMO3': '0.283', 'WEAPON4': '0.500', 'weapon4': '0.500', 'WEAPON5': '0.800', 'weapon5': '0.966', 'WEAPON3': '1.700', 'weapon3': '2.286', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.100'} +[2023-09-14 12:50:01,306][102001] Sum rewards: 14.288, reward structure: {'HEALTH': '-4.050', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.025', 'AMMO2': '0.028', 'weapon4': '0.078', 'AMMO3': '0.122', 'AMMO4': '0.139', 'weapon5': '0.194', 'WEAPON4': '0.200', 'WEAPON5': '0.500', 'weapon2': '0.694', 'WEAPON3': '1.000', 'weapon3': '2.958', 'FRAGCOUNT': '8.000', 'DAMAGECOUNT': '8.400'} +[2023-09-14 12:50:01,785][101964] Updated weights for policy 1, policy_version 1427 (0.0014) +[2023-09-14 12:50:01,896][102001] DAMAGECOUNT value on done: 1081.0 +[2023-09-14 12:50:01,897][102001] Sum rewards: 1.236, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'weapon2': '0.002', 'AMMO5': '0.005', 'AMMO2': '0.025', 'AMMO3': '0.068', 'WEAPON5': '0.100', 'AMMO4': '0.124', 'WEAPON4': '0.300', 'weapon5': '0.530', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon4': '1.174', 'DAMAGECOUNT': '1.500', 'weapon3': '1.808'} +[2023-09-14 12:50:01,896][102001] DAMAGECOUNT value on done: 1221.0 +[2023-09-14 12:50:01,897][102001] Sum rewards: 7.246, reward structure: {'HEALTH': '-1.500', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.010', 'AMMO3': '0.043', 'AMMO4': '0.049', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.300', 'WEAPON3': '0.400', 'weapon2': '0.462', 'weapon4': '0.508', 'weapon3': '1.504', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.060'} +[2023-09-14 12:50:03,337][101965] Updated weights for policy 0, policy_version 2265 (0.0012) +[2023-09-14 12:50:04,577][109198] Fps is (10 sec: 14336.0, 60 sec: 14404.3, 300 sec: 14287.4). Total num frames: 15151104. Throughput: 0: 1828.8, 1: 1733.1. Samples: 1255695. Policy #0 lag: (min: 0.0, avg: 0.5, max: 1.0) +[2023-09-14 12:50:04,579][109198] Avg episode reward: [(0, '4.863'), (1, '3.563')] +[2023-09-14 12:50:07,157][101964] Updated weights for policy 1, policy_version 1437 (0.0012) +[2023-09-14 12:50:09,479][101965] Updated weights for policy 0, policy_version 2275 (0.0016) +[2023-09-14 12:50:09,577][109198] Fps is (10 sec: 14745.7, 60 sec: 14336.0, 300 sec: 14287.4). Total num frames: 15220736. Throughput: 0: 1803.2, 1: 1755.1. Samples: 1276958. Policy #0 lag: (min: 0.0, avg: 0.4, max: 2.0) +[2023-09-14 12:50:09,579][109198] Avg episode reward: [(0, '4.863'), (1, '3.563')] +[2023-09-14 12:50:12,656][101964] Updated weights for policy 1, policy_version 1447 (0.0012) +[2023-09-14 12:50:13,773][102037] DAMAGECOUNT value on done: 2786.0 +[2023-09-14 12:50:13,773][102037] DAMAGECOUNT value on done: 2275.0 +[2023-09-14 12:50:13,773][102037] Sum rewards: 6.938, reward structure: {'HEALTH': '-1.850', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.010', 'AMMO4': '0.026', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.400', 'weapon2': '0.520', 'weapon3': '1.416', 'weapon5': '1.620', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.950'} +[2023-09-14 12:50:13,774][102037] Sum rewards: 3.003, reward structure: {'HEALTH': '-2.900', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.015', 'AMMO5': '0.015', 'AMMO3': '0.061', 'AMMO4': '0.074', 'weapon2': '0.106', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.514', 'WEAPON3': '0.600', 'weapon5': '0.996', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.900', 'weapon3': '2.122'} +[2023-09-14 12:50:14,340][102037] DAMAGECOUNT value on done: 1252.0 +[2023-09-14 12:50:14,340][102037] DAMAGECOUNT value on done: 1175.0 +[2023-09-14 12:50:14,341][102037] Sum rewards: 5.029, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.025', 'AMMO3': '0.040', 'AMMO4': '0.124', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.248', 'WEAPON3': '0.400', 'weapon5': '0.764', 'weapon4': '0.890', 'FRAGCOUNT': '1.000', 'weapon3': '1.528', 'DAMAGECOUNT': '1.600'} +[2023-09-14 12:50:14,341][102037] Sum rewards: 4.288, reward structure: {'HEALTH': '-1.600', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.010', 'AMMO4': '0.025', 'AMMO3': '0.039', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.310', 'WEAPON3': '0.400', 'weapon2': '0.678', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.000', 'weapon3': '1.450', 'weapon5': '1.570'} +[2023-09-14 12:50:14,523][102037] DAMAGECOUNT value on done: 2610.0 +[2023-09-14 12:50:14,524][102037] DAMAGECOUNT value on done: 2680.0 +[2023-09-14 12:50:14,524][102037] Sum rewards: 6.485, reward structure: {'HEALTH': '-2.700', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.007', 'AMMO5': '0.015', 'AMMO4': '0.036', 'AMMO3': '0.060', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'weapon4': '0.300', 'weapon5': '0.550', 'WEAPON3': '0.600', 'weapon2': '0.762', 'weapon3': '2.354', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.100'} +[2023-09-14 12:50:14,525][102037] Sum rewards: 4.057, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.025', 'AMMO3': '0.060', 'AMMO4': '0.125', 'WEAPON4': '0.200', 'weapon4': '0.202', 'WEAPON5': '0.300', 'weapon2': '0.348', 'WEAPON3': '0.600', 'weapon5': '1.206', 'FRAGCOUNT': '2.000', 'weapon3': '2.226', 'DAMAGECOUNT': '2.750'} +[2023-09-14 12:50:14,577][109198] Fps is (10 sec: 13926.5, 60 sec: 14336.0, 300 sec: 14287.4). Total num frames: 15290368. Throughput: 0: 1776.5, 1: 1774.9. Samples: 1298450. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:50:14,579][109198] Avg episode reward: [(0, '4.923'), (1, '3.549')] +[2023-09-14 12:50:15,125][102037] DAMAGECOUNT value on done: 1515.0 +[2023-09-14 12:50:15,125][102037] DAMAGECOUNT value on done: 1579.0 +[2023-09-14 12:50:15,126][102037] Sum rewards: 3.372, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'AMMO4': '-0.002', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO3': '0.109', 'WEAPON4': '0.200', 'weapon4': '0.202', 'WEAPON5': '0.300', 'weapon5': '0.728', 'WEAPON3': '0.800', 'weapon2': '0.946', 'weapon3': '1.924', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.150'} +[2023-09-14 12:50:15,126][102037] Sum rewards: 6.703, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.015', 'AMMO4': '0.072', 'AMMO3': '0.076', 'weapon2': '0.174', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.600', 'weapon4': '0.724', 'weapon5': '0.910', 'weapon3': '1.672', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.050'} +[2023-09-14 12:50:15,244][102005] DAMAGECOUNT value on done: 1195.0 +[2023-09-14 12:50:15,244][102005] DAMAGECOUNT value on done: 1218.0 +[2023-09-14 12:50:15,245][102005] Sum rewards: 6.650, reward structure: {'HEALTH': '-2.800', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.026', 'weapon2': '0.058', 'AMMO3': '0.073', 'AMMO4': '0.131', 'WEAPON4': '0.200', 'weapon4': '0.280', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon3': '1.678', 'weapon5': '1.988', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.100'} +[2023-09-14 12:50:15,245][102005] Sum rewards: 3.185, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.021', 'AMMO3': '0.076', 'WEAPON5': '0.100', 'AMMO4': '0.103', 'WEAPON4': '0.200', 'weapon5': '0.306', 'weapon2': '0.578', 'WEAPON3': '0.600', 'weapon4': '0.714', 'weapon3': '1.582', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.900'} +[2023-09-14 12:50:15,480][101965] Updated weights for policy 0, policy_version 2285 (0.0013) +[2023-09-14 12:50:15,926][102005] DAMAGECOUNT value on done: 1764.0 +[2023-09-14 12:50:15,926][102005] DAMAGECOUNT value on done: 2079.0 +[2023-09-14 12:50:15,926][102005] Sum rewards: 7.152, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.015', 'AMMO4': '0.020', 'AMMO3': '0.066', 'weapon2': '0.164', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.482', 'WEAPON3': '0.600', 'weapon5': '1.390', 'weapon3': '1.860', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.050'} +[2023-09-14 12:50:15,927][102005] Sum rewards: 3.103, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.020', 'AMMO3': '0.070', 'AMMO4': '0.099', 'WEAPON5': '0.200', 'weapon5': '0.392', 'WEAPON4': '0.400', 'weapon2': '0.440', 'WEAPON3': '0.600', 'weapon4': '1.112', 'weapon3': '1.660', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.100'} +[2023-09-14 12:50:17,817][102040] DAMAGECOUNT value on done: 1323.0 +[2023-09-14 12:50:17,817][102040] DAMAGECOUNT value on done: 1040.0 +[2023-09-14 12:50:17,818][102040] Sum rewards: 2.562, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.025', 'AMMO3': '0.030', 'WEAPON5': '0.100', 'AMMO4': '0.125', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.332', 'DAMAGECOUNT': '0.350', 'weapon4': '0.812', 'weapon3': '1.020', 'weapon5': '1.266'} +[2023-09-14 12:50:18,077][101964] Updated weights for policy 1, policy_version 1457 (0.0011) +[2023-09-14 12:50:18,344][102040] DAMAGECOUNT value on done: 718.0 +[2023-09-14 12:50:18,344][102040] DAMAGECOUNT value on done: 925.0 +[2023-09-14 12:50:19,577][109198] Fps is (10 sec: 13926.4, 60 sec: 14199.5, 300 sec: 14259.6). Total num frames: 15360000. Throughput: 0: 1759.7, 1: 1783.3. Samples: 1309008. Policy #0 lag: (min: 0.0, avg: 0.5, max: 1.0) +[2023-09-14 12:50:19,579][109198] Avg episode reward: [(0, '4.939'), (1, '3.515')] +[2023-09-14 12:50:19,853][102005] DAMAGECOUNT value on done: 1288.0 +[2023-09-14 12:50:19,853][102005] DAMAGECOUNT value on done: 1353.0 +[2023-09-14 12:50:20,264][102004] DAMAGECOUNT value on done: 2507.0 +[2023-09-14 12:50:20,264][102004] DAMAGECOUNT value on done: 2226.0 +[2023-09-14 12:50:20,264][102004] Sum rewards: 7.115, reward structure: {'HEALTH': '-3.600', 'DEATHCOUNT': '-3.000', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO3': '0.095', 'WEAPON4': '0.200', 'weapon2': '0.314', 'weapon4': '0.372', 'WEAPON5': '0.400', 'weapon5': '0.774', 'WEAPON3': '0.800', 'weapon3': '2.348', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.400'} +[2023-09-14 12:50:20,265][102004] Sum rewards: 4.485, reward structure: {'HEALTH': '-4.250', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.025', 'AMMO2': '0.026', 'weapon2': '0.112', 'AMMO4': '0.131', 'AMMO3': '0.131', 'WEAPON4': '0.400', 'weapon5': '0.422', 'WEAPON5': '0.500', 'weapon4': '0.684', 'WEAPON3': '1.000', 'weapon3': '2.654', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.650'} +[2023-09-14 12:50:20,424][102005] DAMAGECOUNT value on done: 3230.0 +[2023-09-14 12:50:20,424][102005] DAMAGECOUNT value on done: 3360.0 +[2023-09-14 12:50:20,425][102005] Sum rewards: 4.159, reward structure: {'DEATHCOUNT': '-5.000', 'HEALTH': '-5.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.025', 'AMMO3': '0.119', 'AMMO4': '0.126', 'weapon2': '0.294', 'WEAPON5': '0.400', 'WEAPON4': '0.500', 'weapon5': '0.560', 'weapon4': '0.670', 'WEAPON3': '0.900', 'weapon3': '2.344', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.200'} +[2023-09-14 12:50:20,425][102005] Sum rewards: 8.220, reward structure: {'HEALTH': '-4.000', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'weapon2': '0.006', 'AMMO5': '0.025', 'AMMO2': '0.031', 'AMMO3': '0.120', 'AMMO4': '0.157', 'weapon5': '0.310', 'WEAPON4': '0.400', 'WEAPON5': '0.500', 'weapon4': '0.616', 'WEAPON3': '1.000', 'weapon3': '2.954', 'FRAGCOUNT': '5.000', 'DAMAGECOUNT': '5.100'} +[2023-09-14 12:50:20,867][102004] DAMAGECOUNT value on done: 1781.0 +[2023-09-14 12:50:20,867][102004] DAMAGECOUNT value on done: 2018.0 +[2023-09-14 12:50:20,868][102004] Sum rewards: 1.956, reward structure: {'HEALTH': '-4.150', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.027', 'AMMO3': '0.117', 'AMMO4': '0.136', 'WEAPON5': '0.300', 'WEAPON4': '0.400', 'weapon2': '0.490', 'weapon5': '0.508', 'WEAPON3': '0.800', 'weapon4': '1.030', 'weapon3': '1.532', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.750'} +[2023-09-14 12:50:20,868][102004] Sum rewards: 8.919, reward structure: {'HEALTH': '-2.600', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO4': '0.007', 'AMMO5': '0.015', 'AMMO3': '0.059', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.434', 'weapon2': '0.526', 'WEAPON3': '0.600', 'weapon5': '0.718', 'weapon3': '2.308', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.350'} +[2023-09-14 12:50:21,372][101965] Updated weights for policy 0, policy_version 2295 (0.0015) +[2023-09-14 12:50:22,085][102040] DAMAGECOUNT value on done: 1521.0 +[2023-09-14 12:50:22,085][102040] DAMAGECOUNT value on done: 1134.0 +[2023-09-14 12:50:22,085][102040] Sum rewards: 7.845, reward structure: {'HEALTH': '-0.400', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.019', 'AMMO2': '0.030', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.150', 'WEAPON3': '0.200', 'weapon2': '0.384', 'weapon3': '0.674', 'weapon4': '0.758', 'weapon5': '1.824', 'DAMAGECOUNT': '2.000', 'FRAGCOUNT': '2.000'} +[2023-09-14 12:50:22,646][102040] DAMAGECOUNT value on done: 2710.0 +[2023-09-14 12:50:22,646][102040] DAMAGECOUNT value on done: 2405.0 +[2023-09-14 12:50:22,647][102040] Sum rewards: 10.811, reward structure: {'HEALTH': '-2.700', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.027', 'AMMO3': '0.063', 'AMMO4': '0.134', 'WEAPON4': '0.200', 'weapon2': '0.262', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon5': '0.772', 'weapon4': '0.812', 'weapon3': '2.126', 'FRAGCOUNT': '5.000', 'DAMAGECOUNT': '5.200'} +[2023-09-14 12:50:22,647][102040] Sum rewards: 0.880, reward structure: {'HEALTH': '-5.150', 'DEATHCOUNT': '-5.000', 'HITCOUNT': '0.000', 'weapon2': '0.006', 'AMMO2': '0.008', 'AMMO5': '0.030', 'AMMO4': '0.039', 'AMMO3': '0.163', 'WEAPON4': '0.300', 'weapon4': '0.514', 'WEAPON5': '0.600', 'weapon5': '0.786', 'WEAPON3': '1.200', 'FRAGCOUNT': '2.000', 'weapon3': '2.584', 'DAMAGECOUNT': '2.800'} +[2023-09-14 12:50:23,671][101964] Updated weights for policy 1, policy_version 1467 (0.0014) +[2023-09-14 12:50:24,577][109198] Fps is (10 sec: 14335.9, 60 sec: 14199.5, 300 sec: 14245.8). Total num frames: 15433728. Throughput: 0: 1749.1, 1: 1792.9. Samples: 1330006. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:50:24,579][109198] Avg episode reward: [(0, '5.024'), (1, '3.466')] +[2023-09-14 12:50:24,580][101718] Saving new best policy, reward=5.024! +[2023-09-14 12:50:27,161][101965] Updated weights for policy 0, policy_version 2305 (0.0015) +[2023-09-14 12:50:29,324][101964] Updated weights for policy 1, policy_version 1477 (0.0014) +[2023-09-14 12:50:29,577][109198] Fps is (10 sec: 14336.0, 60 sec: 14199.5, 300 sec: 14245.7). Total num frames: 15503360. Throughput: 0: 1736.6, 1: 1817.6. Samples: 1351714. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:50:29,579][109198] Avg episode reward: [(0, '5.024'), (1, '3.466')] +[2023-09-14 12:50:32,613][102004] DAMAGECOUNT value on done: 2841.0 +[2023-09-14 12:50:32,614][102004] DAMAGECOUNT value on done: 2324.0 +[2023-09-14 12:50:32,614][102004] Sum rewards: 4.315, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.029', 'AMMO3': '0.039', 'AMMO4': '0.146', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon2': '0.396', 'WEAPON3': '0.400', 'weapon5': '0.490', 'weapon4': '0.710', 'FRAGCOUNT': '1.000', 'weapon3': '1.294', 'DAMAGECOUNT': '1.400'} +[2023-09-14 12:50:32,614][102004] Sum rewards: 4.486, reward structure: {'HEALTH': '-1.350', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.009', 'AMMO5': '0.010', 'AMMO3': '0.039', 'AMMO4': '0.043', 'WEAPON4': '0.100', 'weapon4': '0.154', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.406', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.468', 'weapon5': '2.006'} +[2023-09-14 12:50:33,122][102004] DAMAGECOUNT value on done: 2725.0 +[2023-09-14 12:50:33,122][102004] DAMAGECOUNT value on done: 2455.0 +[2023-09-14 12:50:33,122][102004] Sum rewards: 6.469, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.030', 'AMMO3': '0.034', 'AMMO4': '0.150', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon2': '0.266', 'WEAPON3': '0.300', 'weapon3': '0.830', 'weapon4': '0.938', 'weapon5': '1.360', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.150'} +[2023-09-14 12:50:33,123][102004] Sum rewards: 2.917, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.009', 'AMMO4': '0.024', 'AMMO3': '0.075', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.392', 'weapon2': '0.508', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon5': '1.244', 'weapon3': '1.610'} +[2023-09-14 12:50:33,208][101965] Updated weights for policy 0, policy_version 2315 (0.0014) +[2023-09-14 12:50:33,821][102039] DAMAGECOUNT value on done: 975.0 +[2023-09-14 12:50:33,821][102039] DAMAGECOUNT value on done: 1195.0 +[2023-09-14 12:50:33,822][102039] Sum rewards: 4.619, reward structure: {'HEALTH': '-0.500', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.020', 'weapon2': '0.038', 'AMMO4': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon3': '0.604', 'weapon4': '0.614', 'FRAGCOUNT': '1.000', 'weapon5': '1.068', 'DAMAGECOUNT': '1.250'} +[2023-09-14 12:50:34,275][102046] DAMAGECOUNT value on done: 1280.0 +[2023-09-14 12:50:34,276][102046] Sum rewards: 3.900, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.025', 'AMMO3': '0.030', 'WEAPON5': '0.100', 'AMMO4': '0.124', 'weapon2': '0.132', 'WEAPON4': '0.200', 'weapon5': '0.240', 'WEAPON3': '0.300', 'weapon4': '0.880', 'FRAGCOUNT': '1.000', 'weapon3': '1.114', 'DAMAGECOUNT': '1.750'} +[2023-09-14 12:50:34,277][102046] DAMAGECOUNT value on done: 1360.0 +[2023-09-14 12:50:34,277][102046] Sum rewards: 4.271, reward structure: {'HEALTH': '-1.750', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.020', 'AMMO3': '0.045', 'AMMO4': '0.100', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.220', 'WEAPON3': '0.400', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.410', 'weapon5': '2.416'} +[2023-09-14 12:50:34,369][102039] DAMAGECOUNT value on done: 1708.0 +[2023-09-14 12:50:34,369][102039] DAMAGECOUNT value on done: 2137.0 +[2023-09-14 12:50:34,369][102039] Sum rewards: 3.983, reward structure: {'HEALTH': '-2.200', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.020', 'AMMO3': '0.050', 'AMMO4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.232', 'WEAPON4': '0.300', 'weapon2': '0.382', 'WEAPON3': '0.500', 'weapon4': '0.702', 'weapon3': '1.666', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.020'} +[2023-09-14 12:50:34,370][102039] Sum rewards: 5.027, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.012', 'AMMO2': '0.025', 'AMMO3': '0.063', 'AMMO4': '0.126', 'weapon2': '0.286', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'WEAPON3': '0.500', 'weapon5': '0.856', 'weapon4': '0.866', 'weapon3': '1.332', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.360'} +[2023-09-14 12:50:34,577][109198] Fps is (10 sec: 14336.1, 60 sec: 14199.5, 300 sec: 14259.6). Total num frames: 15577088. Throughput: 0: 1727.4, 1: 1825.7. Samples: 1362018. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:50:34,579][109198] Avg episode reward: [(0, '5.047'), (1, '3.499')] +[2023-09-14 12:50:34,580][101718] Saving new best policy, reward=5.047! +[2023-09-14 12:50:34,849][101964] Updated weights for policy 1, policy_version 1487 (0.0013) +[2023-09-14 12:50:34,873][102003] DAMAGECOUNT value on done: 2525.0 +[2023-09-14 12:50:34,874][102003] DAMAGECOUNT value on done: 2285.0 +[2023-09-14 12:50:34,874][102003] Sum rewards: 6.061, reward structure: {'HEALTH': '-4.400', 'DEATHCOUNT': '-4.000', 'AMMO4': '-0.049', 'AMMO2': '-0.010', 'HITCOUNT': '0.000', 'AMMO5': '0.025', 'AMMO3': '0.124', 'weapon5': '0.286', 'WEAPON5': '0.500', 'weapon2': '0.730', 'WEAPON3': '1.000', 'weapon3': '2.904', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.950'} +[2023-09-14 12:50:34,875][102003] Sum rewards: 5.452, reward structure: {'HEALTH': '-4.700', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO2': '0.007', 'AMMO5': '0.025', 'AMMO4': '0.036', 'AMMO3': '0.119', 'WEAPON4': '0.300', 'weapon4': '0.376', 'weapon2': '0.382', 'WEAPON5': '0.500', 'weapon5': '0.836', 'WEAPON3': '0.900', 'weapon3': '2.270', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.400'} +[2023-09-14 12:50:34,920][102046] DAMAGECOUNT value on done: 1581.0 +[2023-09-14 12:50:34,921][102046] Sum rewards: 3.551, reward structure: {'HEALTH': '-2.200', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.018', 'weapon5': '0.034', 'AMMO3': '0.058', 'AMMO4': '0.092', 'WEAPON5': '0.100', 'WEAPON4': '0.300', 'weapon2': '0.348', 'WEAPON3': '0.500', 'weapon4': '0.786', 'weapon3': '1.430', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.080'} +[2023-09-14 12:50:34,921][102046] DAMAGECOUNT value on done: 2060.0 +[2023-09-14 12:50:34,921][102046] Sum rewards: 5.146, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.019', 'AMMO3': '0.071', 'AMMO4': '0.095', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.272', 'WEAPON3': '0.600', 'weapon4': '0.796', 'weapon5': '0.802', 'weapon3': '1.780', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.300'} +[2023-09-14 12:50:35,418][102003] DAMAGECOUNT value on done: 1380.0 +[2023-09-14 12:50:35,418][102003] DAMAGECOUNT value on done: 1370.0 +[2023-09-14 12:50:35,418][102003] Sum rewards: 4.700, reward structure: {'HEALTH': '-2.550', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'weapon2': '0.002', 'AMMO5': '0.015', 'AMMO2': '0.017', 'AMMO3': '0.079', 'AMMO4': '0.085', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'WEAPON3': '0.600', 'weapon4': '0.666', 'weapon3': '1.416', 'weapon5': '1.620', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.150'} +[2023-09-14 12:50:35,419][102003] Sum rewards: 4.086, reward structure: {'HEALTH': '-2.050', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.015', 'weapon2': '0.056', 'weapon5': '0.056', 'AMMO3': '0.063', 'AMMO4': '0.075', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'weapon4': '0.950', 'weapon3': '1.310', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.600'} +[2023-09-14 12:50:35,496][102039] DAMAGECOUNT value on done: 1755.0 +[2023-09-14 12:50:35,496][102039] DAMAGECOUNT value on done: 1033.0 +[2023-09-14 12:50:35,496][102039] Sum rewards: 6.674, reward structure: {'HEALTH': '-0.400', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.019', 'weapon4': '0.096', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.380', 'weapon3': '0.700', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.550', 'weapon5': '2.924'} +[2023-09-14 12:50:35,934][102003] DAMAGECOUNT value on done: 1700.0 +[2023-09-14 12:50:35,935][102003] DAMAGECOUNT value on done: 1273.0 +[2023-09-14 12:50:35,936][102003] Sum rewards: 5.108, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.304', 'weapon2': '0.394', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon3': '1.396', 'DAMAGECOUNT': '1.600', 'weapon5': '1.814'} +[2023-09-14 12:50:35,936][102003] Sum rewards: 3.962, reward structure: {'HEALTH': '-1.550', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.013', 'AMMO3': '0.048', 'AMMO4': '0.064', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.352', 'WEAPON3': '0.400', 'weapon2': '0.672', 'FRAGCOUNT': '1.000', 'weapon3': '1.018', 'DAMAGECOUNT': '1.250', 'weapon5': '1.490'} +[2023-09-14 12:50:36,079][102039] DAMAGECOUNT value on done: 1326.0 +[2023-09-14 12:50:36,080][102039] DAMAGECOUNT value on done: 1365.0 +[2023-09-14 12:50:36,080][102039] Sum rewards: 6.084, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.031', 'AMMO3': '0.032', 'WEAPON5': '0.100', 'AMMO4': '0.154', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.450', 'weapon4': '0.460', 'weapon3': '0.928', 'FRAGCOUNT': '1.000', 'weapon5': '2.126', 'DAMAGECOUNT': '2.300'} +[2023-09-14 12:50:36,216][102046] DAMAGECOUNT value on done: 1222.0 +[2023-09-14 12:50:36,216][102046] DAMAGECOUNT value on done: 1111.0 +[2023-09-14 12:50:36,217][102046] Sum rewards: 5.346, reward structure: {'HEALTH': '-1.900', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.050', 'weapon2': '0.070', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.602', 'weapon5': '1.184', 'weapon3': '1.332', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.150'} +[2023-09-14 12:50:36,217][102046] Sum rewards: 3.396, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.019', 'AMMO3': '0.072', 'AMMO4': '0.093', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon2': '0.416', 'weapon5': '0.442', 'WEAPON3': '0.600', 'weapon4': '0.712', 'FRAGCOUNT': '1.000', 'weapon3': '1.836', 'DAMAGECOUNT': '1.900'} +[2023-09-14 12:50:36,501][102003] DAMAGECOUNT value on done: 1560.0 +[2023-09-14 12:50:36,501][102003] DAMAGECOUNT value on done: 1366.0 +[2023-09-14 12:50:36,502][102003] Sum rewards: 5.845, reward structure: {'HEALTH': '-0.900', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.030', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.150', 'WEAPON3': '0.200', 'weapon2': '0.474', 'weapon4': '0.678', 'weapon3': '0.698', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.550', 'weapon5': '1.740'} +[2023-09-14 12:50:36,780][102046] DAMAGECOUNT value on done: 1235.0 +[2023-09-14 12:50:36,781][102046] DAMAGECOUNT value on done: 1715.0 +[2023-09-14 12:50:36,781][102046] Sum rewards: 4.586, reward structure: {'HEALTH': '-1.500', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.404', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.200', 'weapon3': '1.450', 'weapon5': '2.182'} +[2023-09-14 12:50:36,782][102046] Sum rewards: 4.072, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.030', 'AMMO3': '0.042', 'WEAPON5': '0.100', 'AMMO4': '0.149', 'WEAPON4': '0.200', 'weapon2': '0.254', 'weapon5': '0.312', 'WEAPON3': '0.400', 'weapon4': '0.952', 'FRAGCOUNT': '1.000', 'weapon3': '1.228', 'DAMAGECOUNT': '1.500'} +[2023-09-14 12:50:38,388][101965] Updated weights for policy 0, policy_version 2325 (0.0013) +[2023-09-14 12:50:39,294][102001] DAMAGECOUNT value on done: 967.0 +[2023-09-14 12:50:39,294][102001] DAMAGECOUNT value on done: 1020.0 +[2023-09-14 12:50:39,577][109198] Fps is (10 sec: 14745.6, 60 sec: 14267.7, 300 sec: 14259.6). Total num frames: 15650816. Throughput: 0: 1733.7, 1: 1824.9. Samples: 1383824. Policy #0 lag: (min: 0.0, avg: 0.8, max: 2.0) +[2023-09-14 12:50:39,579][109198] Avg episode reward: [(0, '5.105'), (1, '3.581')] +[2023-09-14 12:50:39,585][101718] Saving new best policy, reward=5.105! +[2023-09-14 12:50:39,806][102001] DAMAGECOUNT value on done: 1710.0 +[2023-09-14 12:50:39,807][102001] DAMAGECOUNT value on done: 1397.0 +[2023-09-14 12:50:39,807][102001] Sum rewards: 5.051, reward structure: {'HEALTH': '-2.150', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO4': '0.050', 'AMMO3': '0.060', 'WEAPON5': '0.100', 'weapon5': '0.136', 'WEAPON4': '0.200', 'weapon4': '0.482', 'WEAPON3': '0.600', 'weapon2': '1.158', 'weapon3': '1.800', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.600'} +[2023-09-14 12:50:39,808][102001] Sum rewards: 4.522, reward structure: {'HEALTH': '-2.600', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.022', 'AMMO2': '-0.004', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO3': '0.065', 'WEAPON4': '0.100', 'weapon4': '0.204', 'WEAPON5': '0.300', 'weapon2': '0.384', 'WEAPON3': '0.600', 'weapon5': '1.230', 'FRAGCOUNT': '2.000', 'weapon3': '2.100', 'DAMAGECOUNT': '2.150'} +[2023-09-14 12:50:41,072][101964] Updated weights for policy 1, policy_version 1497 (0.0012) +[2023-09-14 12:50:41,360][102001] DAMAGECOUNT value on done: 3133.0 +[2023-09-14 12:50:41,360][102001] Sum rewards: 8.944, reward structure: {'HEALTH': '-2.550', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.006', 'AMMO5': '0.015', 'AMMO4': '0.031', 'AMMO3': '0.059', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.502', 'WEAPON3': '0.600', 'weapon2': '0.666', 'weapon5': '0.692', 'weapon3': '2.072', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.350'} +[2023-09-14 12:50:41,360][102001] DAMAGECOUNT value on done: 3585.0 +[2023-09-14 12:50:41,361][102001] Sum rewards: 2.144, reward structure: {'HEALTH': '-4.200', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO2': '0.011', 'AMMO5': '0.020', 'AMMO4': '0.052', 'AMMO3': '0.103', 'weapon4': '0.272', 'WEAPON4': '0.300', 'weapon5': '0.320', 'WEAPON5': '0.400', 'weapon2': '0.548', 'WEAPON3': '0.900', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.650', 'weapon3': '2.768'} +[2023-09-14 12:50:42,068][102001] DAMAGECOUNT value on done: 1371.0 +[2023-09-14 12:50:42,068][102001] DAMAGECOUNT value on done: 1236.0 +[2023-09-14 12:50:42,069][102001] Sum rewards: 4.800, reward structure: {'HEALTH': '-1.500', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.030', 'AMMO3': '0.040', 'AMMO4': '0.150', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.354', 'WEAPON3': '0.400', 'weapon4': '0.728', 'FRAGCOUNT': '1.000', 'weapon3': '1.328', 'weapon5': '1.360', 'DAMAGECOUNT': '1.500'} +[2023-09-14 12:50:42,069][102001] Sum rewards: 3.685, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.014', 'AMMO4': '0.025', 'AMMO3': '0.075', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon2': '0.408', 'weapon4': '0.418', 'WEAPON3': '0.600', 'FRAGCOUNT': '0.999', 'weapon3': '1.494', 'DAMAGECOUNT': '1.550', 'weapon5': '1.596'} +[2023-09-14 12:50:43,567][101965] Updated weights for policy 0, policy_version 2335 (0.0014) +[2023-09-14 12:50:44,577][109198] Fps is (10 sec: 14336.0, 60 sec: 14267.8, 300 sec: 14259.6). Total num frames: 15720448. Throughput: 0: 1762.5, 1: 1808.0. Samples: 1405311. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:50:44,579][109198] Avg episode reward: [(0, '5.074'), (1, '3.631')] +[2023-09-14 12:50:47,477][101964] Updated weights for policy 1, policy_version 1507 (0.0018) +[2023-09-14 12:50:49,452][101965] Updated weights for policy 0, policy_version 2345 (0.0013) +[2023-09-14 12:50:49,577][109198] Fps is (10 sec: 13926.5, 60 sec: 14267.8, 300 sec: 14273.5). Total num frames: 15790080. Throughput: 0: 1767.9, 1: 1784.8. Samples: 1415564. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:50:49,579][109198] Avg episode reward: [(0, '5.074'), (1, '3.631')] +[2023-09-14 12:50:51,286][102037] DAMAGECOUNT value on done: 2575.0 +[2023-09-14 12:50:51,286][102037] DAMAGECOUNT value on done: 3106.0 +[2023-09-14 12:50:51,286][102037] Sum rewards: 5.281, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.010', 'AMMO5': '0.015', 'weapon2': '0.046', 'AMMO4': '0.050', 'AMMO3': '0.078', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.610', 'WEAPON3': '0.700', 'weapon5': '1.148', 'weapon3': '2.124', 'DAMAGECOUNT': '3.000', 'FRAGCOUNT': '3.000'} +[2023-09-14 12:50:51,287][102037] Sum rewards: 5.636, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.017', 'AMMO5': '0.020', 'AMMO3': '0.075', 'AMMO4': '0.087', 'weapon2': '0.134', 'WEAPON4': '0.200', 'WEAPON5': '0.400', 'weapon4': '0.440', 'WEAPON3': '0.700', 'weapon5': '0.990', 'weapon3': '2.372', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.200'} +[2023-09-14 12:50:51,945][102037] DAMAGECOUNT value on done: 1337.0 +[2023-09-14 12:50:51,945][102037] DAMAGECOUNT value on done: 1310.0 +[2023-09-14 12:50:51,946][102037] Sum rewards: 4.460, reward structure: {'HEALTH': '-0.850', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.035', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.174', 'WEAPON3': '0.200', 'weapon3': '0.632', 'weapon5': '0.808', 'weapon4': '0.886', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.350'} +[2023-09-14 12:50:52,190][102037] DAMAGECOUNT value on done: 2770.0 +[2023-09-14 12:50:52,190][102037] DAMAGECOUNT value on done: 2716.0 +[2023-09-14 12:50:52,191][102037] Sum rewards: 3.981, reward structure: {'HEALTH': '-0.800', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'AMMO2': '0.025', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.125', 'WEAPON3': '0.200', 'weapon2': '0.310', 'weapon3': '0.604', 'weapon5': '0.604', 'weapon4': '0.630', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.060'} +[2023-09-14 12:50:52,475][102005] DAMAGECOUNT value on done: 1395.0 +[2023-09-14 12:50:52,475][102005] DAMAGECOUNT value on done: 1328.0 +[2023-09-14 12:50:52,476][102005] Sum rewards: 2.903, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.010', 'AMMO4': '0.025', 'AMMO3': '0.039', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.312', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon3': '1.310', 'weapon5': '2.402'} +[2023-09-14 12:50:52,476][102005] Sum rewards: 6.644, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.027', 'AMMO3': '0.030', 'weapon2': '0.048', 'AMMO4': '0.136', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.300', 'weapon4': '0.844', 'weapon3': '1.060', 'weapon5': '1.888', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.000'} +[2023-09-14 12:50:52,803][102037] DAMAGECOUNT value on done: 1815.0 +[2023-09-14 12:50:52,803][102037] Sum rewards: 4.472, reward structure: {'HEALTH': '-3.900', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.020', 'AMMO4': '0.025', 'AMMO3': '0.096', 'WEAPON4': '0.100', 'weapon4': '0.210', 'weapon2': '0.380', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'weapon5': '0.834', 'weapon3': '2.502', 'DAMAGECOUNT': '3.000', 'FRAGCOUNT': '3.000'} +[2023-09-14 12:50:52,803][102037] DAMAGECOUNT value on done: 1969.0 +[2023-09-14 12:50:52,804][102037] Sum rewards: 6.365, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.020', 'AMMO4': '0.021', 'AMMO3': '0.096', 'WEAPON4': '0.200', 'weapon4': '0.238', 'weapon2': '0.350', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'weapon5': '0.928', 'weapon3': '2.408', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.900'} +[2023-09-14 12:50:53,141][102005] DAMAGECOUNT value on done: 1999.0 +[2023-09-14 12:50:53,141][102005] DAMAGECOUNT value on done: 2194.0 +[2023-09-14 12:50:53,142][102005] Sum rewards: 6.061, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.012', 'AMMO3': '0.037', 'AMMO4': '0.060', 'weapon2': '0.166', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.300', 'weapon4': '0.328', 'weapon3': '0.744', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '2.350', 'weapon5': '2.804'} +[2023-09-14 12:50:53,142][102005] Sum rewards: 2.418, reward structure: {'HEALTH': '-2.850', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.008', 'AMMO5': '0.014', 'AMMO4': '0.041', 'weapon4': '0.046', 'AMMO3': '0.069', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon2': '0.696', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.150', 'weapon3': '1.556', 'weapon5': '1.688'} +[2023-09-14 12:50:53,985][101964] Updated weights for policy 1, policy_version 1517 (0.0014) +[2023-09-14 12:50:54,577][109198] Fps is (10 sec: 13107.1, 60 sec: 14062.9, 300 sec: 14245.7). Total num frames: 15851520. Throughput: 0: 1777.4, 1: 1741.5. Samples: 1435307. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:50:54,579][109198] Avg episode reward: [(0, '5.009'), (1, '3.678')] +[2023-09-14 12:50:55,168][101965] Updated weights for policy 0, policy_version 2355 (0.0013) +[2023-09-14 12:50:55,643][102040] DAMAGECOUNT value on done: 1040.0 +[2023-09-14 12:50:55,644][102040] DAMAGECOUNT value on done: 1388.0 +[2023-09-14 12:50:56,220][102040] DAMAGECOUNT value on done: 1283.0 +[2023-09-14 12:50:56,222][102040] Sum rewards: 4.803, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.013', 'AMMO2': '0.022', 'AMMO3': '0.071', 'AMMO4': '0.108', 'weapon2': '0.160', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'weapon5': '0.334', 'weapon4': '0.550', 'WEAPON3': '0.600', 'weapon3': '1.766', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.580'} +[2023-09-14 12:50:56,222][102040] DAMAGECOUNT value on done: 1023.0 +[2023-09-14 12:50:56,225][102040] Sum rewards: 4.033, reward structure: {'HEALTH': '-3.750', 'DEATHCOUNT': '-3.000', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.017', 'AMMO3': '0.097', 'weapon2': '0.126', 'WEAPON4': '0.200', 'weapon5': '0.308', 'WEAPON5': '0.400', 'weapon4': '0.432', 'WEAPON3': '0.800', 'weapon3': '2.358', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.050'} +[2023-09-14 12:50:57,121][102005] DAMAGECOUNT value on done: 1483.0 +[2023-09-14 12:50:57,121][102005] DAMAGECOUNT value on done: 1408.0 +[2023-09-14 12:50:57,122][102005] Sum rewards: 4.311, reward structure: {'HEALTH': '-1.800', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.009', 'AMMO4': '0.024', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.354', 'WEAPON3': '0.400', 'weapon2': '0.516', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.300', 'weapon3': '1.452', 'weapon5': '1.712'} +[2023-09-14 12:50:57,801][102005] DAMAGECOUNT value on done: 3415.0 +[2023-09-14 12:50:57,801][102005] DAMAGECOUNT value on done: 3385.0 +[2023-09-14 12:50:57,802][102005] Sum rewards: 5.913, reward structure: {'HEALTH': '-0.250', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.030', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.150', 'WEAPON3': '0.200', 'weapon3': '0.532', 'weapon4': '0.592', 'FRAGCOUNT': '1.000', 'weapon5': '1.584', 'DAMAGECOUNT': '1.850'} +[2023-09-14 12:50:58,130][102004] DAMAGECOUNT value on done: 2436.0 +[2023-09-14 12:50:58,131][102004] Sum rewards: 3.214, reward structure: {'HEALTH': '-3.100', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.021', 'AMMO3': '0.077', 'AMMO4': '0.104', 'WEAPON4': '0.300', 'weapon4': '0.310', 'weapon5': '0.374', 'WEAPON5': '0.400', 'weapon2': '0.402', 'WEAPON3': '0.700', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.100', 'weapon3': '2.506'} +[2023-09-14 12:50:58,131][102004] DAMAGECOUNT value on done: 2837.0 +[2023-09-14 12:50:58,131][102004] Sum rewards: 6.980, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.013', 'AMMO3': '0.050', 'AMMO4': '0.065', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.500', 'weapon2': '0.592', 'weapon4': '0.642', 'weapon5': '0.762', 'weapon3': '1.646', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.300'} +[2023-09-14 12:50:58,704][102004] DAMAGECOUNT value on done: 2773.0 +[2023-09-14 12:50:58,705][102004] DAMAGECOUNT value on done: 2431.0 +[2023-09-14 12:50:58,705][102004] Sum rewards: 8.927, reward structure: {'HEALTH': '-6.250', 'DEATHCOUNT': '-6.000', 'HITCOUNT': '0.000', 'AMMO5': '0.035', 'AMMO2': '0.052', 'weapon2': '0.102', 'AMMO3': '0.143', 'AMMO4': '0.259', 'weapon4': '0.430', 'weapon5': '0.474', 'WEAPON4': '0.500', 'WEAPON5': '0.700', 'WEAPON3': '1.100', 'weapon3': '2.832', 'FRAGCOUNT': '7.000', 'DAMAGECOUNT': '7.550'} +[2023-09-14 12:50:58,706][102004] Sum rewards: 4.702, reward structure: {'HEALTH': '-7.300', 'DEATHCOUNT': '-7.000', 'HITCOUNT': '0.000', 'AMMO2': '0.016', 'AMMO5': '0.035', 'AMMO4': '0.081', 'weapon2': '0.104', 'AMMO3': '0.197', 'weapon5': '0.458', 'WEAPON4': '0.500', 'WEAPON5': '0.700', 'weapon4': '0.756', 'WEAPON3': '1.300', 'weapon3': '2.354', 'FRAGCOUNT': '6.000', 'DAMAGECOUNT': '6.500'} +[2023-09-14 12:50:59,577][109198] Fps is (10 sec: 13516.7, 60 sec: 14199.5, 300 sec: 14245.7). Total num frames: 15925248. Throughput: 0: 1791.6, 1: 1706.7. Samples: 1455875. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:50:59,579][109198] Avg episode reward: [(0, '4.982'), (1, '3.804')] +[2023-09-14 12:51:00,012][102040] DAMAGECOUNT value on done: 1586.0 +[2023-09-14 12:51:00,013][102040] DAMAGECOUNT value on done: 1239.0 +[2023-09-14 12:51:00,013][102040] Sum rewards: 5.879, reward structure: {'HEALTH': '-0.650', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.102', 'WEAPON3': '0.200', 'weapon2': '0.350', 'weapon3': '0.768', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon5': '2.834'} +[2023-09-14 12:51:00,161][101964] Updated weights for policy 1, policy_version 1527 (0.0013) +[2023-09-14 12:51:00,586][102040] DAMAGECOUNT value on done: 2790.0 +[2023-09-14 12:51:00,586][102040] DAMAGECOUNT value on done: 2612.0 +[2023-09-14 12:51:00,587][102040] Sum rewards: 6.084, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.010', 'AMMO3': '0.040', 'AMMO4': '0.050', 'weapon2': '0.164', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.568', 'weapon5': '1.102', 'weapon3': '1.324', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.070'} +[2023-09-14 12:51:00,753][101965] Updated weights for policy 0, policy_version 2365 (0.0012) +[2023-09-14 12:51:04,577][109198] Fps is (10 sec: 14336.0, 60 sec: 14062.9, 300 sec: 14245.7). Total num frames: 15994880. Throughput: 0: 1811.0, 1: 1697.5. Samples: 1466890. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:51:04,579][109198] Avg episode reward: [(0, '4.987'), (1, '3.783')] +[2023-09-14 12:51:06,402][101964] Updated weights for policy 1, policy_version 1537 (0.0012) +[2023-09-14 12:51:06,414][101965] Updated weights for policy 0, policy_version 2375 (0.0012) +[2023-09-14 12:51:09,577][109198] Fps is (10 sec: 13926.4, 60 sec: 14062.9, 300 sec: 14231.9). Total num frames: 16064512. Throughput: 0: 1823.4, 1: 1683.7. Samples: 1487827. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:51:09,579][109198] Avg episode reward: [(0, '4.987'), (1, '3.783')] +[2023-09-14 12:51:10,723][102004] DAMAGECOUNT value on done: 2899.0 +[2023-09-14 12:51:10,723][102004] DAMAGECOUNT value on done: 2458.0 +[2023-09-14 12:51:10,724][102004] Sum rewards: 5.879, reward structure: {'HEALTH': '-0.580', 'AMMO4': '-0.000', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.168', 'WEAPON3': '0.200', 'weapon2': '0.218', 'weapon3': '0.708', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.340', 'weapon5': '2.600'} +[2023-09-14 12:51:11,478][102004] DAMAGECOUNT value on done: 2820.0 +[2023-09-14 12:51:11,478][102004] DAMAGECOUNT value on done: 2530.0 +[2023-09-14 12:51:11,614][102046] DAMAGECOUNT value on done: 1277.0 +[2023-09-14 12:51:11,614][102046] DAMAGECOUNT value on done: 1211.0 +[2023-09-14 12:51:11,615][102046] Sum rewards: 5.987, reward structure: {'HEALTH': '-0.550', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.020', 'AMMO4': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon2': '0.122', 'WEAPON3': '0.200', 'weapon4': '0.550', 'weapon3': '0.602', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.000', 'weapon5': '2.718'} +[2023-09-14 12:51:11,749][101965] Updated weights for policy 0, policy_version 2385 (0.0012) +[2023-09-14 12:51:12,275][101964] Updated weights for policy 1, policy_version 1547 (0.0012) +[2023-09-14 12:51:12,357][102046] DAMAGECOUNT value on done: 1320.0 +[2023-09-14 12:51:12,357][102046] DAMAGECOUNT value on done: 1795.0 +[2023-09-14 12:51:13,605][102046] DAMAGECOUNT value on done: 1530.0 +[2023-09-14 12:51:13,605][102046] DAMAGECOUNT value on done: 1670.0 +[2023-09-14 12:51:13,606][102046] Sum rewards: 3.641, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.019', 'AMMO3': '0.060', 'AMMO4': '0.096', 'weapon4': '0.184', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon5': '0.476', 'WEAPON3': '0.600', 'weapon2': '0.912', 'FRAGCOUNT': '2.000', 'weapon3': '2.278', 'DAMAGECOUNT': '2.500'} +[2023-09-14 12:51:13,606][102046] Sum rewards: 4.753, reward structure: {'HEALTH': '-3.450', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.014', 'AMMO5': '0.017', 'AMMO4': '0.069', 'AMMO3': '0.100', 'WEAPON4': '0.300', 'weapon2': '0.394', 'WEAPON5': '0.400', 'weapon4': '0.422', 'weapon5': '0.492', 'WEAPON3': '0.800', 'weapon3': '2.096', 'FRAGCOUNT': '2.999', 'DAMAGECOUNT': '3.100'} +[2023-09-14 12:51:13,757][102039] DAMAGECOUNT value on done: 1302.0 +[2023-09-14 12:51:13,758][102039] DAMAGECOUNT value on done: 1014.0 +[2023-09-14 12:51:13,758][102039] Sum rewards: 3.624, reward structure: {'HEALTH': '-0.590', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO3': '0.020', 'weapon2': '0.022', 'AMMO4': '0.024', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.302', 'weapon3': '0.668', 'weapon5': '0.700', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.070'} +[2023-09-14 12:51:13,936][102003] DAMAGECOUNT value on done: 2770.0 +[2023-09-14 12:51:13,937][102003] Sum rewards: 3.737, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO4': '0.000', 'AMMO5': '0.018', 'AMMO3': '0.097', 'WEAPON4': '0.300', 'weapon2': '0.394', 'WEAPON5': '0.400', 'weapon5': '0.474', 'weapon4': '0.596', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.999', 'weapon3': '2.208', 'DAMAGECOUNT': '2.450'} +[2023-09-14 12:51:13,937][102003] DAMAGECOUNT value on done: 2505.0 +[2023-09-14 12:51:13,937][102003] Sum rewards: 4.804, reward structure: {'HEALTH': '-2.450', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.013', 'AMMO5': '0.015', 'AMMO3': '0.053', 'AMMO4': '0.066', 'WEAPON4': '0.200', 'weapon4': '0.252', 'WEAPON5': '0.300', 'WEAPON3': '0.500', 'weapon5': '0.976', 'weapon2': '1.010', 'weapon3': '1.668', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.200'} +[2023-09-14 12:51:14,180][102046] DAMAGECOUNT value on done: 1711.0 +[2023-09-14 12:51:14,181][102046] Sum rewards: 5.297, reward structure: {'HEALTH': '-0.300', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.010', 'weapon2': '0.018', 'AMMO2': '0.020', 'AMMO4': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.100', 'WEAPON5': '0.100', 'weapon3': '0.382', 'weapon4': '0.608', 'weapon5': '0.856', 'DAMAGECOUNT': '1.300', 'FRAGCOUNT': '2.000'} +[2023-09-14 12:51:14,181][102046] DAMAGECOUNT value on done: 2090.0 +[2023-09-14 12:51:14,431][102039] DAMAGECOUNT value on done: 1978.0 +[2023-09-14 12:51:14,431][102039] DAMAGECOUNT value on done: 2272.0 +[2023-09-14 12:51:14,432][102039] Sum rewards: 6.998, reward structure: {'HEALTH': '-1.350', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '1.056', 'weapon3': '1.430', 'weapon5': '1.542', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.700'} +[2023-09-14 12:51:14,432][102039] Sum rewards: 2.736, reward structure: {'HEALTH': '-2.650', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.015', 'weapon2': '0.042', 'AMMO3': '0.063', 'WEAPON4': '0.100', 'weapon4': '0.212', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.350', 'weapon5': '1.578', 'weapon3': '2.126'} +[2023-09-14 12:51:14,543][102003] DAMAGECOUNT value on done: 1485.0 +[2023-09-14 12:51:14,543][102003] DAMAGECOUNT value on done: 1534.0 +[2023-09-14 12:51:14,544][102003] Sum rewards: 3.901, reward structure: {'HEALTH': '-1.540', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.045', 'WEAPON4': '0.100', 'weapon4': '0.198', 'WEAPON5': '0.200', 'weapon2': '0.388', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '1.198', 'weapon5': '1.882'} +[2023-09-14 12:51:14,544][102003] Sum rewards: 5.168, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.030', 'AMMO3': '0.049', 'WEAPON5': '0.100', 'AMMO4': '0.150', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.450', 'weapon4': '0.882', 'FRAGCOUNT': '1.000', 'weapon3': '1.050', 'weapon5': '1.214', 'DAMAGECOUNT': '1.640'} +[2023-09-14 12:51:14,577][109198] Fps is (10 sec: 14336.0, 60 sec: 14131.2, 300 sec: 14245.7). Total num frames: 16138240. Throughput: 0: 1846.0, 1: 1663.9. Samples: 1509657. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:51:14,579][109198] Avg episode reward: [(0, '4.894'), (1, '3.827')] +[2023-09-14 12:51:15,103][102003] DAMAGECOUNT value on done: 1862.0 +[2023-09-14 12:51:15,103][102003] DAMAGECOUNT value on done: 1313.0 +[2023-09-14 12:51:15,626][102039] DAMAGECOUNT value on done: 1790.0 +[2023-09-14 12:51:15,626][102039] DAMAGECOUNT value on done: 1113.0 +[2023-09-14 12:51:15,682][102003] DAMAGECOUNT value on done: 1589.0 +[2023-09-14 12:51:15,682][102003] DAMAGECOUNT value on done: 1411.0 +[2023-09-14 12:51:16,160][102039] DAMAGECOUNT value on done: 1421.0 +[2023-09-14 12:51:16,160][102039] DAMAGECOUNT value on done: 1470.0 +[2023-09-14 12:51:16,160][102039] Sum rewards: 4.352, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.025', 'AMMO3': '0.030', 'WEAPON5': '0.100', 'AMMO4': '0.124', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon2': '0.302', 'weapon4': '0.816', 'weapon3': '0.854', 'DAMAGECOUNT': '0.950', 'FRAGCOUNT': '1.000', 'weapon5': '1.646'} +[2023-09-14 12:51:16,161][102039] Sum rewards: 3.571, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.043', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.710', 'weapon5': '0.880', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon3': '1.280'} +[2023-09-14 12:51:17,004][101965] Updated weights for policy 0, policy_version 2395 (0.0012) +[2023-09-14 12:51:18,312][101964] Updated weights for policy 1, policy_version 1557 (0.0013) +[2023-09-14 12:51:18,674][102001] DAMAGECOUNT value on done: 3258.0 +[2023-09-14 12:51:18,674][102001] DAMAGECOUNT value on done: 3710.0 +[2023-09-14 12:51:18,675][102001] Sum rewards: 4.731, reward structure: {'HEALTH': '-1.200', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'weapon2': '0.002', 'AMMO5': '0.005', 'AMMO2': '0.015', 'AMMO3': '0.040', 'AMMO4': '0.075', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.694', 'FRAGCOUNT': '1.000', 'weapon3': '1.220', 'DAMAGECOUNT': '1.250', 'weapon5': '1.930'} +[2023-09-14 12:51:18,675][102001] Sum rewards: 3.767, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.013', 'AMMO2': '0.037', 'AMMO3': '0.084', 'AMMO4': '0.184', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'WEAPON3': '0.600', 'weapon4': '0.664', 'FRAGCOUNT': '0.999', 'weapon3': '1.178', 'DAMAGECOUNT': '1.250', 'weapon5': '2.158'} +[2023-09-14 12:51:19,175][102001] DAMAGECOUNT value on done: 1581.0 +[2023-09-14 12:51:19,175][102001] Sum rewards: 5.469, reward structure: {'HEALTH': '-1.500', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.015', 'AMMO3': '0.040', 'AMMO4': '0.075', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.508', 'weapon4': '0.558', 'FRAGCOUNT': '1.000', 'weapon3': '1.148', 'weapon5': '1.716', 'DAMAGECOUNT': '2.100'} +[2023-09-14 12:51:19,176][102001] DAMAGECOUNT value on done: 1366.0 +[2023-09-14 12:51:19,577][109198] Fps is (10 sec: 14336.0, 60 sec: 14131.2, 300 sec: 14259.6). Total num frames: 16207872. Throughput: 0: 1860.8, 1: 1658.0. Samples: 1520363. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:51:19,579][109198] Avg episode reward: [(0, '4.873'), (1, '3.891')] +[2023-09-14 12:51:20,319][102001] DAMAGECOUNT value on done: 1135.0 +[2023-09-14 12:51:20,319][102001] DAMAGECOUNT value on done: 1082.0 +[2023-09-14 12:51:20,319][102001] Sum rewards: 4.413, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.015', 'AMMO3': '0.047', 'AMMO4': '0.075', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.424', 'weapon4': '0.590', 'FRAGCOUNT': '1.000', 'weapon3': '1.026', 'DAMAGECOUNT': '1.150', 'weapon5': '1.428'} +[2023-09-14 12:51:20,320][102001] Sum rewards: 4.989, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.020', 'AMMO3': '0.040', 'AMMO4': '0.099', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon2': '0.202', 'WEAPON3': '0.400', 'weapon4': '0.758', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150', 'weapon3': '1.184', 'weapon5': '1.776'} +[2023-09-14 12:51:20,940][102001] DAMAGECOUNT value on done: 1772.0 +[2023-09-14 12:51:20,940][102001] DAMAGECOUNT value on done: 1935.0 +[2023-09-14 12:51:20,941][102001] Sum rewards: 7.650, reward structure: {'HEALTH': '-2.150', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'weapon4': '0.032', 'AMMO3': '0.065', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon2': '0.730', 'weapon5': '1.132', 'weapon3': '2.082', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.750'} +[2023-09-14 12:51:20,941][102001] Sum rewards: 2.734, reward structure: {'HEALTH': '-3.750', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.012', 'AMMO5': '0.015', 'AMMO4': '0.059', 'weapon4': '0.078', 'AMMO3': '0.088', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'weapon2': '0.368', 'WEAPON3': '0.700', 'weapon5': '1.398', 'FRAGCOUNT': '2.000', 'weapon3': '2.116', 'DAMAGECOUNT': '2.250'} +[2023-09-14 12:51:22,567][101965] Updated weights for policy 0, policy_version 2405 (0.0013) +[2023-09-14 12:51:24,495][101964] Updated weights for policy 1, policy_version 1567 (0.0012) +[2023-09-14 12:51:24,577][109198] Fps is (10 sec: 14336.0, 60 sec: 14131.2, 300 sec: 14273.5). Total num frames: 16281600. Throughput: 0: 1852.4, 1: 1650.7. Samples: 1541463. Policy #0 lag: (min: 0.0, avg: 0.7, max: 3.0) +[2023-09-14 12:51:24,579][109198] Avg episode reward: [(0, '4.900'), (1, '3.970')] +[2023-09-14 12:51:24,581][101802] Saving new best policy, reward=3.970! +[2023-09-14 12:51:28,293][101965] Updated weights for policy 0, policy_version 2415 (0.0012) +[2023-09-14 12:51:28,951][102037] DAMAGECOUNT value on done: 3211.0 +[2023-09-14 12:51:28,951][102037] DAMAGECOUNT value on done: 2690.0 +[2023-09-14 12:51:28,952][102037] Sum rewards: 2.711, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.009', 'AMMO4': '0.027', 'AMMO3': '0.067', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.298', 'WEAPON3': '0.500', 'weapon2': '0.732', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '1.192', 'weapon5': '1.532'} +[2023-09-14 12:51:28,952][102037] Sum rewards: 4.658, reward structure: {'HEALTH': '-1.050', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.714', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.150', 'weapon5': '1.624', 'weapon3': '1.630'} +[2023-09-14 12:51:29,531][102037] DAMAGECOUNT value on done: 1355.0 +[2023-09-14 12:51:29,532][102037] DAMAGECOUNT value on done: 1345.0 +[2023-09-14 12:51:29,577][109198] Fps is (10 sec: 14336.0, 60 sec: 14131.2, 300 sec: 14245.8). Total num frames: 16351232. Throughput: 0: 1836.9, 1: 1655.2. Samples: 1562453. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:51:29,579][109198] Avg episode reward: [(0, '4.835'), (1, '3.994')] +[2023-09-14 12:51:29,586][101802] Saving new best policy, reward=3.994! +[2023-09-14 12:51:29,706][102037] DAMAGECOUNT value on done: 2776.0 +[2023-09-14 12:51:29,706][102037] DAMAGECOUNT value on done: 2855.0 +[2023-09-14 12:51:29,909][102005] DAMAGECOUNT value on done: 1328.0 +[2023-09-14 12:51:29,909][102005] DAMAGECOUNT value on done: 1565.0 +[2023-09-14 12:51:29,910][102005] Sum rewards: 5.577, reward structure: {'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'AMMO2': '0.030', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.150', 'WEAPON3': '0.200', 'weapon3': '0.592', 'weapon4': '0.782', 'weapon5': '0.898', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.700'} +[2023-09-14 12:51:30,289][102037] DAMAGECOUNT value on done: 2113.0 +[2023-09-14 12:51:30,289][102037] DAMAGECOUNT value on done: 2116.0 +[2023-09-14 12:51:30,290][102037] Sum rewards: 6.674, reward structure: {'HEALTH': '-1.600', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.007', 'AMMO4': '0.024', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon2': '0.348', 'WEAPON3': '0.400', 'weapon4': '0.404', 'weapon5': '1.212', 'weapon3': '1.554', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.980'} +[2023-09-14 12:51:30,290][102037] Sum rewards: 1.772, reward structure: {'HEALTH': '-2.180', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.008', 'AMMO5': '0.012', 'AMMO4': '0.038', 'AMMO3': '0.075', 'weapon2': '0.086', 'weapon5': '0.124', 'WEAPON4': '0.200', 'weapon4': '0.256', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.470', 'weapon3': '1.782'} +[2023-09-14 12:51:30,509][102005] DAMAGECOUNT value on done: 2444.0 +[2023-09-14 12:51:30,509][102005] DAMAGECOUNT value on done: 2704.0 +[2023-09-14 12:51:30,510][102005] Sum rewards: 7.323, reward structure: {'HEALTH': '-4.250', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO2': '0.021', 'AMMO3': '0.097', 'AMMO4': '0.102', 'weapon2': '0.210', 'WEAPON5': '0.300', 'WEAPON4': '0.400', 'weapon5': '0.502', 'weapon4': '0.594', 'WEAPON3': '0.800', 'weapon3': '2.432', 'FRAGCOUNT': '5.000', 'DAMAGECOUNT': '5.100'} +[2023-09-14 12:51:30,509][102005] Sum rewards: 4.155, reward structure: {'HEALTH': '-5.290', 'DEATHCOUNT': '-5.000', 'HITCOUNT': '0.000', 'AMMO2': '0.012', 'AMMO5': '0.028', 'AMMO4': '0.062', 'AMMO3': '0.149', 'WEAPON4': '0.200', 'weapon4': '0.286', 'weapon2': '0.352', 'weapon5': '0.462', 'WEAPON5': '0.600', 'WEAPON3': '1.100', 'weapon3': '2.744', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.450'} +[2023-09-14 12:51:30,737][101964] Updated weights for policy 1, policy_version 1577 (0.0013) +[2023-09-14 12:51:33,398][102040] DAMAGECOUNT value on done: 1548.0 +[2023-09-14 12:51:33,399][102040] Sum rewards: 4.485, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.010', 'AMMO4': '0.026', 'AMMO3': '0.055', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.372', 'WEAPON3': '0.400', 'weapon5': '0.416', 'weapon2': '0.468', 'weapon3': '0.832', 'DAMAGECOUNT': '1.600', 'FRAGCOUNT': '2.000'} +[2023-09-14 12:51:33,398][102040] DAMAGECOUNT value on done: 1150.0 +[2023-09-14 12:51:33,400][102040] Sum rewards: 1.850, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO3': '0.040', 'WEAPON4': '0.100', 'weapon4': '0.194', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.480', 'weapon5': '0.728', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon3': '1.630'} +[2023-09-14 12:51:33,833][101965] Updated weights for policy 0, policy_version 2425 (0.0013) +[2023-09-14 12:51:33,926][102040] DAMAGECOUNT value on done: 1503.0 +[2023-09-14 12:51:33,927][102040] DAMAGECOUNT value on done: 1423.0 +[2023-09-14 12:51:33,927][102040] Sum rewards: 2.380, reward structure: {'HEALTH': '-3.950', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.015', 'AMMO4': '0.022', 'WEAPON4': '0.100', 'AMMO3': '0.102', 'weapon4': '0.196', 'WEAPON5': '0.300', 'weapon2': '0.442', 'WEAPON3': '0.800', 'weapon5': '0.920', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.200', 'weapon3': '2.228'} +[2023-09-14 12:51:33,928][102040] Sum rewards: 7.851, reward structure: {'HEALTH': '-2.100', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.049', 'AMMO2': '-0.010', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO3': '0.060', 'WEAPON4': '0.100', 'weapon4': '0.194', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'weapon2': '0.760', 'weapon5': '0.778', 'weapon3': '2.202', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '4.000'} +[2023-09-14 12:51:34,475][102005] DAMAGECOUNT value on done: 1443.0 +[2023-09-14 12:51:34,475][102005] DAMAGECOUNT value on done: 1498.0 +[2023-09-14 12:51:34,577][109198] Fps is (10 sec: 13926.4, 60 sec: 14062.9, 300 sec: 14245.7). Total num frames: 16420864. Throughput: 0: 1833.0, 1: 1654.6. Samples: 1572509. Policy #0 lag: (min: 0.0, avg: 0.4, max: 2.0) +[2023-09-14 12:51:34,579][109198] Avg episode reward: [(0, '4.791'), (1, '4.021')] +[2023-09-14 12:51:34,581][101802] Saving new best policy, reward=4.021! +[2023-09-14 12:51:35,053][102005] DAMAGECOUNT value on done: 3685.0 +[2023-09-14 12:51:35,053][102005] DAMAGECOUNT value on done: 3565.0 +[2023-09-14 12:51:35,054][102005] Sum rewards: 6.098, reward structure: {'HEALTH': '-2.050', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.014', 'AMMO2': '0.020', 'AMMO3': '0.050', 'weapon2': '0.056', 'AMMO4': '0.098', 'WEAPON4': '0.300', 'WEAPON5': '0.300', 'WEAPON3': '0.500', 'weapon5': '0.956', 'weapon4': '1.034', 'weapon3': '1.822', 'FRAGCOUNT': '1.998', 'DAMAGECOUNT': '3.000'} +[2023-09-14 12:51:36,352][102004] DAMAGECOUNT value on done: 3098.0 +[2023-09-14 12:51:36,353][102004] DAMAGECOUNT value on done: 2831.0 +[2023-09-14 12:51:36,353][102004] Sum rewards: 2.934, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.018', 'AMMO3': '0.057', 'AMMO4': '0.091', 'WEAPON5': '0.100', 'weapon2': '0.126', 'WEAPON4': '0.400', 'WEAPON3': '0.500', 'weapon5': '0.694', 'weapon4': '1.026', 'weapon3': '1.306', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.610'} +[2023-09-14 12:51:36,353][102004] Sum rewards: 5.792, reward structure: {'HEALTH': '-3.590', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.013', 'AMMO2': '0.015', 'weapon2': '0.054', 'AMMO4': '0.072', 'AMMO3': '0.081', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon4': '0.530', 'WEAPON3': '0.700', 'weapon5': '1.032', 'weapon3': '2.336', 'FRAGCOUNT': '2.999', 'DAMAGECOUNT': '3.950'} +[2023-09-14 12:51:36,738][101964] Updated weights for policy 1, policy_version 1587 (0.0014) +[2023-09-14 12:51:36,912][102004] DAMAGECOUNT value on done: 2946.0 +[2023-09-14 12:51:36,912][102004] DAMAGECOUNT value on done: 3258.0 +[2023-09-14 12:51:36,913][102004] Sum rewards: 7.393, reward structure: {'HEALTH': '-4.700', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.025', 'AMMO2': '0.027', 'weapon2': '0.078', 'AMMO3': '0.129', 'AMMO4': '0.134', 'weapon5': '0.364', 'WEAPON4': '0.400', 'weapon4': '0.480', 'WEAPON5': '0.500', 'WEAPON3': '1.000', 'weapon3': '2.806', 'FRAGCOUNT': '5.000', 'DAMAGECOUNT': '5.150'} +[2023-09-14 12:51:36,913][102004] Sum rewards: 5.328, reward structure: {'DEATHCOUNT': '-5.000', 'HEALTH': '-5.000', 'HITCOUNT': '0.000', 'AMMO2': '0.029', 'AMMO5': '0.030', 'AMMO4': '0.143', 'AMMO3': '0.160', 'weapon4': '0.188', 'weapon5': '0.220', 'weapon2': '0.336', 'WEAPON4': '0.400', 'WEAPON5': '0.600', 'WEAPON3': '1.200', 'weapon3': '3.172', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.850'} +[2023-09-14 12:51:37,478][102040] DAMAGECOUNT value on done: 1514.0 +[2023-09-14 12:51:37,478][102040] DAMAGECOUNT value on done: 1911.0 +[2023-09-14 12:51:37,479][102040] Sum rewards: 4.236, reward structure: {'HEALTH': '-3.150', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.024', 'AMMO3': '0.083', 'AMMO4': '0.118', 'weapon2': '0.248', 'weapon5': '0.294', 'WEAPON4': '0.300', 'weapon4': '0.370', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.750', 'weapon3': '2.978'} +[2023-09-14 12:51:37,479][102040] Sum rewards: 5.458, reward structure: {'HEALTH': '-2.600', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.005', 'AMMO4': '0.018', 'AMMO3': '0.058', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.336', 'WEAPON3': '0.500', 'weapon2': '0.724', 'weapon5': '0.764', 'weapon3': '1.198', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.250'} +[2023-09-14 12:51:38,136][102040] DAMAGECOUNT value on done: 2890.0 +[2023-09-14 12:51:38,136][102040] DAMAGECOUNT value on done: 2657.0 +[2023-09-14 12:51:39,577][109198] Fps is (10 sec: 13926.6, 60 sec: 13994.7, 300 sec: 14231.9). Total num frames: 16490496. Throughput: 0: 1851.5, 1: 1673.5. Samples: 1593933. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:51:39,579][101965] Updated weights for policy 0, policy_version 2435 (0.0013) +[2023-09-14 12:51:39,579][109198] Avg episode reward: [(0, '4.809'), (1, '3.976')] +[2023-09-14 12:51:42,848][101964] Updated weights for policy 1, policy_version 1597 (0.0014) +[2023-09-14 12:51:44,577][109198] Fps is (10 sec: 13926.5, 60 sec: 13994.7, 300 sec: 14245.7). Total num frames: 16560128. Throughput: 0: 1859.9, 1: 1681.4. Samples: 1615235. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:51:44,580][109198] Avg episode reward: [(0, '4.809'), (1, '3.976')] +[2023-09-14 12:51:45,011][101965] Updated weights for policy 0, policy_version 2445 (0.0013) +[2023-09-14 12:51:46,078][102046] DAMAGECOUNT value on done: 1416.0 +[2023-09-14 12:51:46,078][102046] DAMAGECOUNT value on done: 1457.0 +[2023-09-14 12:51:46,079][102046] Sum rewards: 5.865, reward structure: {'HEALTH': '-1.800', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.019', 'AMMO3': '0.040', 'AMMO4': '0.095', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.400', 'weapon4': '0.432', 'weapon2': '0.652', 'weapon3': '1.166', 'weapon5': '1.606', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.050'} +[2023-09-14 12:51:46,079][102046] Sum rewards: 3.358, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.020', 'AMMO3': '0.040', 'AMMO4': '0.098', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon2': '0.316', 'WEAPON3': '0.400', 'weapon4': '0.744', 'FRAGCOUNT': '1.000', 'weapon5': '1.198', 'weapon3': '1.232', 'DAMAGECOUNT': '1.800'} +[2023-09-14 12:51:46,640][102046] DAMAGECOUNT value on done: 1365.0 +[2023-09-14 12:51:46,640][102046] DAMAGECOUNT value on done: 1825.0 +[2023-09-14 12:51:48,884][102004] DAMAGECOUNT value on done: 3279.0 +[2023-09-14 12:51:48,884][102004] DAMAGECOUNT value on done: 2578.0 +[2023-09-14 12:51:48,885][102004] Sum rewards: 8.645, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.026', 'AMMO3': '0.039', 'weapon2': '0.074', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.128', 'WEAPON3': '0.400', 'weapon4': '0.668', 'weapon5': '1.098', 'weapon3': '1.356', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.800'} +[2023-09-14 12:51:48,885][102004] Sum rewards: 1.006, reward structure: {'HEALTH': '-3.650', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.019', 'AMMO5': '0.020', 'AMMO4': '0.096', 'AMMO3': '0.106', 'weapon2': '0.242', 'WEAPON4': '0.300', 'weapon4': '0.382', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'weapon5': '0.896', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.200', 'weapon3': '2.194'} +[2023-09-14 12:51:49,112][101964] Updated weights for policy 1, policy_version 1607 (0.0013) +[2023-09-14 12:51:49,477][102004] DAMAGECOUNT value on done: 2990.0 +[2023-09-14 12:51:49,478][102004] DAMAGECOUNT value on done: 2633.0 +[2023-09-14 12:51:49,478][102004] Sum rewards: 4.764, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.043', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.238', 'WEAPON3': '0.400', 'weapon2': '0.570', 'FRAGCOUNT': '1.000', 'weapon3': '1.176', 'weapon5': '1.432', 'DAMAGECOUNT': '1.700'} +[2023-09-14 12:51:49,479][102004] Sum rewards: 2.819, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.030', 'AMMO3': '0.044', 'AMMO4': '0.150', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.798', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.030', 'weapon3': '1.220', 'weapon5': '1.740'} +[2023-09-14 12:51:49,577][109198] Fps is (10 sec: 13926.2, 60 sec: 13994.6, 300 sec: 14245.7). Total num frames: 16629760. Throughput: 0: 1850.7, 1: 1673.6. Samples: 1625486. Policy #0 lag: (min: 0.0, avg: 0.5, max: 2.0) +[2023-09-14 12:51:49,579][109198] Avg episode reward: [(0, '4.783'), (1, '4.098')] +[2023-09-14 12:51:49,586][101718] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002453_10047488.pth... +[2023-09-14 12:51:49,586][101802] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001607_6582272.pth... +[2023-09-14 12:51:49,648][101802] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001204_4931584.pth +[2023-09-14 12:51:49,652][101718] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002022_8282112.pth +[2023-09-14 12:51:49,657][101802] Saving new best policy, reward=4.098! +[2023-09-14 12:51:50,495][101965] Updated weights for policy 0, policy_version 2455 (0.0012) +[2023-09-14 12:51:52,649][102046] DAMAGECOUNT value on done: 1996.0 +[2023-09-14 12:51:52,649][102046] DAMAGECOUNT value on done: 1990.0 +[2023-09-14 12:51:52,650][102046] Sum rewards: 7.168, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.007', 'AMMO5': '0.019', 'AMMO4': '0.035', 'weapon2': '0.066', 'AMMO3': '0.095', 'WEAPON4': '0.300', 'WEAPON5': '0.400', 'weapon4': '0.666', 'weapon5': '0.746', 'WEAPON3': '0.800', 'weapon3': '2.432', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '4.600'} +[2023-09-14 12:51:52,650][102046] Sum rewards: 2.800, reward structure: {'HEALTH': '-4.000', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO2': '0.012', 'AMMO5': '0.015', 'AMMO4': '0.058', 'AMMO3': '0.101', 'weapon4': '0.140', 'WEAPON4': '0.200', 'weapon5': '0.212', 'weapon2': '0.234', 'WEAPON5': '0.400', 'WEAPON3': '0.900', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '3.260', 'weapon3': '3.268'} +[2023-09-14 12:51:53,333][102046] DAMAGECOUNT value on done: 1830.0 +[2023-09-14 12:51:53,333][102046] DAMAGECOUNT value on done: 2180.0 +[2023-09-14 12:51:53,334][102046] Sum rewards: 4.933, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.030', 'AMMO3': '0.055', 'weapon2': '0.098', 'WEAPON4': '0.100', 'AMMO4': '0.150', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.780', 'weapon3': '0.782', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.190', 'weapon5': '2.140'} +[2023-09-14 12:51:53,334][102046] Sum rewards: 1.793, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.012', 'AMMO3': '0.066', 'WEAPON4': '0.100', 'weapon4': '0.206', 'WEAPON5': '0.300', 'weapon2': '0.382', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.900', 'weapon5': '1.018', 'weapon3': '2.240'} +[2023-09-14 12:51:53,593][102039] DAMAGECOUNT value on done: 1407.0 +[2023-09-14 12:51:53,594][102039] DAMAGECOUNT value on done: 1216.0 +[2023-09-14 12:51:53,594][102039] Sum rewards: 1.170, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.013', 'AMMO3': '0.077', 'weapon2': '0.112', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.416', 'WEAPON3': '0.700', 'weapon5': '0.844', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '2.464'} +[2023-09-14 12:51:53,595][102039] Sum rewards: 6.862, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.030', 'AMMO3': '0.040', 'AMMO4': '0.150', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.998', 'weapon3': '1.258', 'weapon5': '1.556', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.020'} +[2023-09-14 12:51:53,634][102003] DAMAGECOUNT value on done: 3030.0 +[2023-09-14 12:51:53,635][102003] DAMAGECOUNT value on done: 3170.0 +[2023-09-14 12:51:53,635][102003] Sum rewards: 7.904, reward structure: {'DEATHCOUNT': '-4.000', 'HEALTH': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.020', 'AMMO2': '0.024', 'AMMO4': '0.119', 'AMMO3': '0.119', 'weapon5': '0.288', 'WEAPON4': '0.300', 'weapon4': '0.388', 'WEAPON5': '0.400', 'weapon2': '0.744', 'WEAPON3': '0.900', 'weapon3': '2.352', 'FRAGCOUNT': '5.000', 'DAMAGECOUNT': '5.250'} +[2023-09-14 12:51:53,636][102003] Sum rewards: 3.869, reward structure: {'HEALTH': '-5.100', 'DEATHCOUNT': '-5.000', 'HITCOUNT': '0.000', 'AMMO2': '0.002', 'AMMO4': '0.010', 'AMMO5': '0.030', 'WEAPON4': '0.100', 'weapon4': '0.136', 'AMMO3': '0.152', 'weapon2': '0.156', 'weapon5': '0.194', 'WEAPON5': '0.600', 'WEAPON3': '1.200', 'weapon3': '3.388', 'DAMAGECOUNT': '4.000', 'FRAGCOUNT': '4.000'} +[2023-09-14 12:51:54,197][102039] DAMAGECOUNT value on done: 2422.0 +[2023-09-14 12:51:54,198][102039] Sum rewards: 4.191, reward structure: {'HEALTH': '-4.800', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO2': '0.007', 'AMMO5': '0.020', 'AMMO4': '0.036', 'AMMO3': '0.110', 'weapon4': '0.168', 'WEAPON4': '0.200', 'WEAPON5': '0.400', 'weapon2': '0.424', 'weapon5': '0.482', 'WEAPON3': '0.900', 'weapon3': '2.804', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '4.440'} +[2023-09-14 12:51:54,197][102039] DAMAGECOUNT value on done: 2742.0 +[2023-09-14 12:51:54,199][102039] Sum rewards: 5.205, reward structure: {'HEALTH': '-4.000', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO2': '0.013', 'AMMO5': '0.020', 'weapon4': '0.020', 'AMMO4': '0.065', 'WEAPON4': '0.100', 'AMMO3': '0.103', 'weapon5': '0.214', 'WEAPON5': '0.400', 'weapon2': '0.530', 'WEAPON3': '0.900', 'FRAGCOUNT': '3.000', 'weapon3': '3.140', 'DAMAGECOUNT': '4.700'} +[2023-09-14 12:51:54,244][102003] DAMAGECOUNT value on done: 1585.0 +[2023-09-14 12:51:54,244][102003] DAMAGECOUNT value on done: 1704.0 +[2023-09-14 12:51:54,258][102003] Sum rewards: 4.864, reward structure: {'DEATHCOUNT': '-1.000', 'HEALTH': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.032', 'AMMO3': '0.036', 'WEAPON5': '0.100', 'AMMO4': '0.160', 'WEAPON4': '0.200', 'weapon2': '0.202', 'WEAPON3': '0.300', 'weapon3': '0.738', 'weapon4': '0.934', 'FRAGCOUNT': '1.000', 'weapon5': '1.456', 'DAMAGECOUNT': '1.700'} +[2023-09-14 12:51:54,245][102003] Sum rewards: 4.006, reward structure: {'HEALTH': '-1.650', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO5': '0.010', 'AMMO4': '0.023', 'AMMO3': '0.046', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.464', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.000', 'weapon3': '1.414', 'weapon5': '2.094'} +[2023-09-14 12:51:54,577][109198] Fps is (10 sec: 13926.3, 60 sec: 14131.2, 300 sec: 14231.9). Total num frames: 16699392. Throughput: 0: 1853.0, 1: 1670.2. Samples: 1646372. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:51:54,579][109198] Avg episode reward: [(0, '4.677'), (1, '4.168')] +[2023-09-14 12:51:54,581][101802] Saving new best policy, reward=4.168! +[2023-09-14 12:51:54,797][102001] Large shaping reward 2.602 for [('FRAGCOUNT', 1.0, 1.0), ('HITCOUNT', 0.0, 1.0), ('DAMAGECOUNT', 1.6, 160.0), ('weapon5', 0.002)] +[2023-09-14 12:51:55,054][102003] DAMAGECOUNT value on done: 2080.0 +[2023-09-14 12:51:55,054][102003] DAMAGECOUNT value on done: 1633.0 +[2023-09-14 12:51:55,055][102003] Sum rewards: 6.976, reward structure: {'HEALTH': '-2.250', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.015', 'AMMO4': '0.018', 'AMMO3': '0.064', 'WEAPON4': '0.200', 'weapon4': '0.272', 'WEAPON5': '0.300', 'weapon2': '0.420', 'WEAPON3': '0.600', 'weapon5': '0.892', 'weapon3': '2.242', 'FRAGCOUNT': '2.999', 'DAMAGECOUNT': '3.200'} +[2023-09-14 12:51:55,055][102003] Sum rewards: 2.215, reward structure: {'HEALTH': '-3.150', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.000', 'AMMO4': '0.000', 'AMMO5': '0.008', 'weapon4': '0.022', 'WEAPON4': '0.100', 'AMMO3': '0.112', 'WEAPON5': '0.200', 'weapon2': '0.718', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon5': '1.334', 'weapon3': '1.890', 'DAMAGECOUNT': '2.180'} +[2023-09-14 12:51:55,315][102001] DAMAGECOUNT value on done: 3730.0 +[2023-09-14 12:51:55,315][102001] DAMAGECOUNT value on done: 3363.0 +[2023-09-14 12:51:55,316][102001] Sum rewards: 5.422, reward structure: {'HEALTH': '-0.200', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.020', 'AMMO3': '0.020', 'AMMO4': '0.097', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon4': '0.302', 'weapon2': '0.370', 'weapon3': '0.586', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon5': '1.772'} +[2023-09-14 12:51:55,382][101964] Updated weights for policy 1, policy_version 1617 (0.0013) +[2023-09-14 12:51:55,520][102039] DAMAGECOUNT value on done: 2005.0 +[2023-09-14 12:51:55,520][102039] Sum rewards: 4.426, reward structure: {'HEALTH': '-2.850', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.009', 'AMMO5': '0.015', 'AMMO4': '0.046', 'AMMO3': '0.060', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.368', 'weapon2': '0.392', 'WEAPON3': '0.600', 'weapon5': '1.006', 'FRAGCOUNT': '2.000', 'weapon3': '2.130', 'DAMAGECOUNT': '2.150'} +[2023-09-14 12:51:55,521][102039] DAMAGECOUNT value on done: 1408.0 +[2023-09-14 12:51:55,521][102039] Sum rewards: 5.793, reward structure: {'DEATHCOUNT': '-2.000', 'HEALTH': '-2.000', 'HITCOUNT': '0.000', 'AMMO2': '0.010', 'AMMO5': '0.010', 'AMMO4': '0.047', 'AMMO3': '0.060', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.462', 'weapon2': '0.574', 'WEAPON3': '0.600', 'weapon5': '0.920', 'weapon3': '1.760', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.950'} +[2023-09-14 12:51:55,662][102003] DAMAGECOUNT value on done: 1899.0 +[2023-09-14 12:51:55,662][102003] DAMAGECOUNT value on done: 1696.0 +[2023-09-14 12:51:55,663][102003] Sum rewards: 5.632, reward structure: {'HEALTH': '-3.100', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.012', 'AMMO5': '0.019', 'AMMO4': '0.057', 'AMMO3': '0.092', 'weapon4': '0.294', 'WEAPON4': '0.300', 'WEAPON5': '0.400', 'weapon2': '0.416', 'weapon5': '0.546', 'WEAPON3': '0.800', 'weapon3': '2.696', 'FRAGCOUNT': '2.999', 'DAMAGECOUNT': '3.100'} +[2023-09-14 12:51:55,663][102003] Sum rewards: 2.848, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'weapon2': '0.016', 'AMMO2': '0.018', 'AMMO4': '0.087', 'AMMO3': '0.093', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon5': '0.458', 'weapon4': '0.674', 'WEAPON3': '0.700', 'weapon3': '1.542', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.850'} +[2023-09-14 12:51:55,824][102001] DAMAGECOUNT value on done: 1466.0 +[2023-09-14 12:51:55,825][102001] Sum rewards: 3.971, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.009', 'AMMO3': '0.040', 'AMMO4': '0.045', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.294', 'WEAPON3': '0.400', 'weapon2': '0.414', 'DAMAGECOUNT': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.138', 'weapon5': '1.426'} +[2023-09-14 12:51:55,825][102001] DAMAGECOUNT value on done: 1694.0 +[2023-09-14 12:51:55,826][102001] Sum rewards: 3.751, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.025', 'AMMO3': '0.030', 'WEAPON5': '0.100', 'weapon2': '0.116', 'AMMO4': '0.125', 'WEAPON4': '0.200', 'WEAPON3': '0.300', 'weapon4': '0.866', 'weapon5': '0.912', 'weapon3': '0.942', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.130'} +[2023-09-14 12:51:56,219][101965] Updated weights for policy 0, policy_version 2465 (0.0014) +[2023-09-14 12:51:56,230][102039] DAMAGECOUNT value on done: 1448.0 +[2023-09-14 12:51:56,231][102039] Sum rewards: 0.016, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO2': '0.013', 'AMMO4': '0.066', 'AMMO3': '0.069', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.270', 'WEAPON4': '0.300', 'weapon2': '0.346', 'WEAPON3': '0.500', 'weapon5': '0.598', 'weapon4': '0.644', 'weapon3': '1.002'} +[2023-09-14 12:51:56,231][102039] DAMAGECOUNT value on done: 1575.0 +[2023-09-14 12:51:56,232][102039] Sum rewards: 3.637, reward structure: {'HEALTH': '-1.880', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.050', 'AMMO2': '-0.010', 'HITCOUNT': '0.000', 'AMMO5': '0.006', 'AMMO3': '0.040', 'WEAPON5': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.754', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.050', 'weapon3': '1.564', 'weapon5': '1.564'} +[2023-09-14 12:51:59,577][109198] Fps is (10 sec: 13516.8, 60 sec: 13994.7, 300 sec: 14204.1). Total num frames: 16764928. Throughput: 0: 1829.6, 1: 1653.3. Samples: 1666387. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:51:59,579][109198] Avg episode reward: [(0, '4.648'), (1, '4.152')] +[2023-09-14 12:52:01,236][102001] DAMAGECOUNT value on done: 1202.0 +[2023-09-14 12:52:01,236][102001] DAMAGECOUNT value on done: 1640.0 +[2023-09-14 12:52:01,237][102001] Sum rewards: 10.475, reward structure: {'HEALTH': '-1.300', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.015', 'AMMO3': '0.039', 'AMMO4': '0.075', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon2': '0.348', 'WEAPON3': '0.400', 'weapon4': '0.604', 'weapon3': '1.082', 'weapon5': '1.752', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '5.050'} +[2023-09-14 12:52:01,904][102001] DAMAGECOUNT value on done: 2441.0 +[2023-09-14 12:52:01,904][102001] DAMAGECOUNT value on done: 2167.0 +[2023-09-14 12:52:01,905][102001] Sum rewards: 6.340, reward structure: {'HEALTH': '-4.650', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO2': '0.019', 'AMMO5': '0.022', 'AMMO4': '0.095', 'AMMO3': '0.130', 'weapon2': '0.242', 'WEAPON4': '0.300', 'weapon5': '0.372', 'weapon4': '0.390', 'WEAPON5': '0.500', 'WEAPON3': '1.000', 'weapon3': '2.858', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '5.060'} +[2023-09-14 12:52:01,906][102001] Sum rewards: 5.795, reward structure: {'HEALTH': '-4.000', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO2': '0.012', 'AMMO5': '0.025', 'AMMO4': '0.059', 'weapon4': '0.076', 'AMMO3': '0.135', 'WEAPON4': '0.200', 'weapon2': '0.378', 'WEAPON5': '0.500', 'weapon5': '0.772', 'WEAPON3': '1.000', 'weapon3': '2.688', 'DAMAGECOUNT': '3.950', 'FRAGCOUNT': '4.000'} +[2023-09-14 12:52:01,911][101964] Updated weights for policy 1, policy_version 1627 (0.0013) +[2023-09-14 12:52:02,198][101965] Updated weights for policy 0, policy_version 2475 (0.0013) +[2023-09-14 12:52:04,577][109198] Fps is (10 sec: 13516.8, 60 sec: 13994.7, 300 sec: 14190.2). Total num frames: 16834560. Throughput: 0: 1820.6, 1: 1645.6. Samples: 1676343. Policy #0 lag: (min: 0.0, avg: 0.7, max: 2.0) +[2023-09-14 12:52:04,579][109198] Avg episode reward: [(0, '4.674'), (1, '4.166')] +[2023-09-14 12:52:07,172][102037] DAMAGECOUNT value on done: 3396.0 +[2023-09-14 12:52:07,172][102037] DAMAGECOUNT value on done: 2920.0 +[2023-09-14 12:52:07,172][102037] Sum rewards: 2.104, reward structure: {'HEALTH': '-3.200', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.003', 'AMMO4': '0.016', 'AMMO5': '0.019', 'AMMO3': '0.102', 'WEAPON4': '0.200', 'weapon2': '0.396', 'WEAPON5': '0.400', 'weapon4': '0.450', 'WEAPON3': '0.800', 'weapon5': '0.826', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.850', 'weapon3': '2.242'} +[2023-09-14 12:52:07,173][102037] Sum rewards: 6.209, reward structure: {'HEALTH': '-1.850', 'DEATHCOUNT': '-1.000', 'AMMO4': '-0.022', 'AMMO2': '-0.004', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO3': '0.039', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.208', 'weapon2': '0.342', 'WEAPON3': '0.400', 'weapon3': '1.592', 'weapon5': '1.894', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.300'} +[2023-09-14 12:52:07,588][101965] Updated weights for policy 0, policy_version 2485 (0.0013) +[2023-09-14 12:52:07,729][102037] DAMAGECOUNT value on done: 1465.0 +[2023-09-14 12:52:07,729][102037] DAMAGECOUNT value on done: 1430.0 +[2023-09-14 12:52:07,730][102037] Sum rewards: 5.659, reward structure: {'HEALTH': '-0.850', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.346', 'weapon3': '0.758', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.100', 'weapon5': '3.010'} +[2023-09-14 12:52:07,928][102037] DAMAGECOUNT value on done: 3225.0 +[2023-09-14 12:52:07,929][102037] DAMAGECOUNT value on done: 3200.0 +[2023-09-14 12:52:07,929][102037] Sum rewards: 4.162, reward structure: {'DEATHCOUNT': '-4.000', 'HEALTH': '-4.000', 'HITCOUNT': '0.000', 'AMMO2': '0.014', 'AMMO5': '0.020', 'AMMO4': '0.069', 'AMMO3': '0.091', 'WEAPON4': '0.200', 'weapon2': '0.286', 'WEAPON5': '0.400', 'weapon4': '0.662', 'weapon5': '0.738', 'WEAPON3': '0.800', 'weapon3': '2.182', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.700'} +[2023-09-14 12:52:07,930][102037] Sum rewards: 6.431, reward structure: {'HEALTH': '-3.550', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.015', 'AMMO3': '0.064', 'AMMO4': '0.075', 'WEAPON5': '0.200', 'weapon5': '0.252', 'weapon2': '0.318', 'WEAPON4': '0.400', 'WEAPON3': '0.600', 'weapon4': '1.032', 'weapon3': '1.774', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.240'} +[2023-09-14 12:52:07,970][101964] Updated weights for policy 1, policy_version 1637 (0.0012) +[2023-09-14 12:52:08,168][102005] DAMAGECOUNT value on done: 1665.0 +[2023-09-14 12:52:08,169][102005] DAMAGECOUNT value on done: 1446.0 +[2023-09-14 12:52:08,169][102005] Sum rewards: 3.972, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.015', 'AMMO3': '0.040', 'AMMO4': '0.075', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon2': '0.424', 'weapon4': '0.586', 'weapon5': '0.956', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.000', 'weapon3': '1.216'} +[2023-09-14 12:52:08,170][102005] Sum rewards: 1.218, reward structure: {'HEALTH': '-3.150', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO5': '0.010', 'AMMO2': '0.010', 'AMMO4': '0.050', 'AMMO3': '0.089', 'WEAPON4': '0.200', 'weapon2': '0.236', 'weapon5': '0.264', 'WEAPON5': '0.300', 'weapon4': '0.392', 'WEAPON3': '0.800', 'FRAGCOUNT': '0.998', 'DAMAGECOUNT': '1.180', 'weapon3': '2.838'} +[2023-09-14 12:52:08,502][102037] DAMAGECOUNT value on done: 2491.0 +[2023-09-14 12:52:08,502][102037] DAMAGECOUNT value on done: 2428.0 +[2023-09-14 12:52:08,503][102037] Sum rewards: 3.711, reward structure: {'HEALTH': '-4.000', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.018', 'AMMO2': '0.027', 'AMMO4': '0.137', 'weapon5': '0.138', 'AMMO3': '0.144', 'WEAPON4': '0.300', 'WEAPON5': '0.400', 'weapon4': '0.532', 'weapon2': '0.766', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.999', 'weapon3': '2.500', 'DAMAGECOUNT': '3.750'} +[2023-09-14 12:52:08,503][102037] Sum rewards: 5.447, reward structure: {'HEALTH': '-3.100', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.011', 'AMMO5': '0.018', 'weapon4': '0.026', 'AMMO4': '0.056', 'AMMO3': '0.080', 'WEAPON4': '0.100', 'weapon5': '0.164', 'WEAPON5': '0.400', 'weapon2': '0.650', 'WEAPON3': '0.800', 'FRAGCOUNT': '2.999', 'weapon3': '3.092', 'DAMAGECOUNT': '3.150'} +[2023-09-14 12:52:08,709][102005] DAMAGECOUNT value on done: 2879.0 +[2023-09-14 12:52:08,709][102005] DAMAGECOUNT value on done: 2869.0 +[2023-09-14 12:52:08,709][102005] Sum rewards: 8.875, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.018', 'AMMO2': '-0.003', 'HITCOUNT': '0.000', 'AMMO5': '0.009', 'AMMO3': '0.064', 'WEAPON5': '0.200', 'weapon5': '0.314', 'WEAPON3': '0.600', 'weapon2': '1.088', 'weapon3': '2.272', 'FRAGCOUNT': '3.999', 'DAMAGECOUNT': '4.350'} +[2023-09-14 12:52:08,710][102005] Sum rewards: 0.354, reward structure: {'HEALTH': '-4.150', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.025', 'AMMO2': '0.027', 'AMMO4': '0.134', 'AMMO3': '0.142', 'weapon5': '0.268', 'WEAPON4': '0.300', 'weapon4': '0.388', 'WEAPON5': '0.500', 'weapon2': '0.572', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.650', 'weapon3': '2.498'} +[2023-09-14 12:52:09,577][109198] Fps is (10 sec: 13926.4, 60 sec: 13994.7, 300 sec: 14190.2). Total num frames: 16904192. Throughput: 0: 1821.6, 1: 1648.5. Samples: 1697620. Policy #0 lag: (min: 0.0, avg: 0.6, max: 2.0) +[2023-09-14 12:52:09,579][109198] Avg episode reward: [(0, '4.592'), (1, '4.190')] +[2023-09-14 12:52:09,586][101802] Saving new best policy, reward=4.190! +[2023-09-14 12:52:11,646][102040] DAMAGECOUNT value on done: 1800.0 +[2023-09-14 12:52:11,646][102040] DAMAGECOUNT value on done: 1550.0 +[2023-09-14 12:52:11,647][102040] Sum rewards: 2.537, reward structure: {'HEALTH': '-3.850', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'weapon2': '0.006', 'AMMO5': '0.010', 'AMMO2': '0.011', 'AMMO4': '0.056', 'AMMO3': '0.102', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon4': '0.798', 'WEAPON3': '0.800', 'weapon5': '0.832', 'weapon3': '1.752', 'FRAGCOUNT': '2.000', 'DAMAGECOUNT': '2.520'} +[2023-09-14 12:52:11,647][102040] Sum rewards: 7.574, reward structure: {'HEALTH': '-2.400', 'DEATHCOUNT': '-2.000', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'HITCOUNT': '0.000', 'AMMO5': '0.015', 'AMMO3': '0.064', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'weapon4': '0.320', 'weapon2': '0.380', 'WEAPON3': '0.600', 'weapon5': '1.038', 'weapon3': '2.158', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '4.000'} +[2023-09-14 12:52:12,221][102040] DAMAGECOUNT value on done: 1932.0 +[2023-09-14 12:52:12,222][102040] Sum rewards: 1.529, reward structure: {'HEALTH': '-6.400', 'DEATHCOUNT': '-6.000', 'HITCOUNT': '0.000', 'AMMO2': '0.021', 'AMMO5': '0.030', 'AMMO4': '0.102', 'AMMO3': '0.211', 'weapon2': '0.258', 'weapon5': '0.278', 'weapon4': '0.374', 'WEAPON4': '0.400', 'WEAPON5': '0.600', 'WEAPON3': '1.400', 'weapon3': '2.966', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '4.290'} +[2023-09-14 12:52:12,222][102040] DAMAGECOUNT value on done: 2063.0 +[2023-09-14 12:52:12,222][102040] Sum rewards: 9.384, reward structure: {'HEALTH': '-4.150', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.025', 'AMMO2': '0.044', 'weapon2': '0.108', 'AMMO3': '0.114', 'weapon5': '0.128', 'weapon4': '0.128', 'AMMO4': '0.219', 'WEAPON4': '0.300', 'WEAPON5': '0.500', 'WEAPON3': '1.000', 'weapon3': '3.568', 'FRAGCOUNT': '5.000', 'DAMAGECOUNT': '6.400'} +[2023-09-14 12:52:12,673][102005] DAMAGECOUNT value on done: 1473.0 +[2023-09-14 12:52:12,673][102005] DAMAGECOUNT value on done: 1646.0 +[2023-09-14 12:52:12,674][102005] Sum rewards: 1.265, reward structure: {'HEALTH': '-2.000', 'DEATHCOUNT': '-2.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'weapon2': '0.002', 'AMMO5': '0.009', 'AMMO2': '0.025', 'AMMO3': '0.079', 'AMMO4': '0.124', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.600', 'weapon4': '0.894', 'weapon3': '1.292', 'weapon5': '1.540'} +[2023-09-14 12:52:12,674][102005] Sum rewards: 4.087, reward structure: {'HEALTH': '-0.300', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO3': '0.020', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon2': '0.396', 'weapon5': '0.466', 'weapon3': '0.752', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.480'} +[2023-09-14 12:52:13,068][101965] Updated weights for policy 0, policy_version 2495 (0.0013) +[2023-09-14 12:52:13,221][102005] DAMAGECOUNT value on done: 3993.0 +[2023-09-14 12:52:13,221][102005] DAMAGECOUNT value on done: 4000.0 +[2023-09-14 12:52:13,221][102005] Sum rewards: 4.039, reward structure: {'HEALTH': '-4.150', 'DEATHCOUNT': '-4.000', 'HITCOUNT': '0.000', 'AMMO5': '0.024', 'AMMO2': '0.037', 'AMMO3': '0.125', 'weapon2': '0.148', 'AMMO4': '0.186', 'weapon4': '0.262', 'WEAPON4': '0.400', 'WEAPON5': '0.500', 'weapon5': '0.622', 'WEAPON3': '1.000', 'weapon3': '2.804', 'FRAGCOUNT': '3.000', 'DAMAGECOUNT': '3.080'} +[2023-09-14 12:52:13,222][102005] Sum rewards: 7.919, reward structure: {'HEALTH': '-3.000', 'DEATHCOUNT': '-3.000', 'HITCOUNT': '0.000', 'AMMO2': '0.018', 'AMMO5': '0.020', 'AMMO3': '0.078', 'weapon2': '0.078', 'AMMO4': '0.090', 'WEAPON5': '0.400', 'WEAPON4': '0.400', 'WEAPON3': '0.700', 'weapon5': '0.814', 'weapon4': '1.042', 'weapon3': '1.928', 'FRAGCOUNT': '4.000', 'DAMAGECOUNT': '4.350'} +[2023-09-14 12:52:13,352][109198] Keyboard interrupt detected in the event loop EvtLoop [Runner_EvtLoop, process=main process 109198], exiting... +[2023-09-14 12:52:13,354][101802] Stopping Batcher_1... +[2023-09-14 12:52:13,354][101718] Stopping Batcher_0... +[2023-09-14 12:52:13,354][101802] Loop batcher_evt_loop terminating... +[2023-09-14 12:52:13,355][101802] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001646_6742016.pth... +[2023-09-14 12:52:13,355][101718] Loop batcher_evt_loop terminating... +[2023-09-14 12:52:13,356][101718] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002495_10219520.pth... +[2023-09-14 12:52:13,354][109198] Runner profile tree view: +main_loop: 501.4412 +[2023-09-14 12:52:13,357][109198] Collected {0: 10219520, 1: 6737920}, FPS: 13706.7 +[2023-09-14 12:52:13,382][101964] Weights refcount: 2 0 +[2023-09-14 12:52:13,383][101964] Stopping InferenceWorker_p1-w0... +[2023-09-14 12:52:13,383][101964] Loop inference_proc1-0_evt_loop terminating... +[2023-09-14 12:52:13,384][101965] Weights refcount: 2 0 +[2023-09-14 12:52:13,385][101965] Stopping InferenceWorker_p0-w0... +[2023-09-14 12:52:13,386][101965] Loop inference_proc0-0_evt_loop terminating... +[2023-09-14 12:52:13,415][101718] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002241_9179136.pth +[2023-09-14 12:52:13,421][101718] Stopping LearnerWorker_p0... +[2023-09-14 12:52:13,421][101718] Loop learner_proc0_evt_loop terminating... +[2023-09-14 12:52:13,432][101802] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001405_5754880.pth +[2023-09-14 12:52:13,444][101802] Stopping LearnerWorker_p1... +[2023-09-14 12:52:13,445][101802] Loop learner_proc1_evt_loop terminating... +[2023-09-14 12:52:14,165][102046] Stopping RolloutWorker_w7... +[2023-09-14 12:52:14,166][102046] Loop rollout_proc7_evt_loop terminating... +[2023-09-14 12:52:14,171][102005] Stopping RolloutWorker_w3... +[2023-09-14 12:52:14,172][102005] Loop rollout_proc3_evt_loop terminating... +[2023-09-14 12:52:14,174][102040] Stopping RolloutWorker_w6... +[2023-09-14 12:52:14,174][102003] Stopping RolloutWorker_w1... +[2023-09-14 12:52:14,174][102039] Stopping RolloutWorker_w5... +[2023-09-14 12:52:14,174][102004] Stopping RolloutWorker_w2... +[2023-09-14 12:52:14,175][102040] Loop rollout_proc6_evt_loop terminating... +[2023-09-14 12:52:14,175][102039] Loop rollout_proc5_evt_loop terminating... +[2023-09-14 12:52:14,175][102003] Loop rollout_proc1_evt_loop terminating... +[2023-09-14 12:52:14,175][102004] Loop rollout_proc2_evt_loop terminating... +[2023-09-14 12:52:14,177][102037] Stopping RolloutWorker_w4... +[2023-09-14 12:52:14,177][102037] Loop rollout_proc4_evt_loop terminating... +[2023-09-14 12:52:14,179][102001] Stopping RolloutWorker_w0... +[2023-09-14 12:52:14,180][102001] Loop rollout_proc0_evt_loop terminating... +[2023-09-14 12:54:01,880][109198] Environment doom_basic already registered, overwriting... +[2023-09-14 12:54:01,883][109198] Environment doom_two_colors_easy already registered, overwriting... +[2023-09-14 12:54:01,885][109198] Environment doom_two_colors_hard already registered, overwriting... +[2023-09-14 12:54:01,886][109198] Environment doom_dm already registered, overwriting... +[2023-09-14 12:54:01,888][109198] Environment doom_dwango5 already registered, overwriting... +[2023-09-14 12:54:01,889][109198] Environment doom_my_way_home_flat_actions already registered, overwriting... +[2023-09-14 12:54:01,891][109198] Environment doom_defend_the_center_flat_actions already registered, overwriting... +[2023-09-14 12:54:01,892][109198] Environment doom_my_way_home already registered, overwriting... +[2023-09-14 12:54:01,893][109198] Environment doom_deadly_corridor already registered, overwriting... +[2023-09-14 12:54:01,895][109198] Environment doom_defend_the_center already registered, overwriting... +[2023-09-14 12:54:01,896][109198] Environment doom_defend_the_line already registered, overwriting... +[2023-09-14 12:54:01,897][109198] Environment doom_health_gathering already registered, overwriting... +[2023-09-14 12:54:01,898][109198] Environment doom_health_gathering_supreme already registered, overwriting... +[2023-09-14 12:54:01,898][109198] Environment doom_battle already registered, overwriting... +[2023-09-14 12:54:01,899][109198] Environment doom_battle2 already registered, overwriting... +[2023-09-14 12:54:01,900][109198] Environment doom_duel_bots already registered, overwriting... +[2023-09-14 12:54:01,901][109198] Environment doom_deathmatch_bots already registered, overwriting... +[2023-09-14 12:54:01,902][109198] Environment doom_duel already registered, overwriting... +[2023-09-14 12:54:01,903][109198] Environment doom_deathmatch_full already registered, overwriting... +[2023-09-14 12:54:01,904][109198] Environment doom_benchmark already registered, overwriting... +[2023-09-14 12:54:01,905][109198] register_encoder_factory: +[2023-09-14 12:54:01,925][109198] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json +[2023-09-14 12:54:01,933][109198] Experiment dir /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment already exists! +[2023-09-14 12:54:01,934][109198] Resuming existing experiment from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment... +[2023-09-14 12:54:01,936][109198] Weights and Biases integration disabled +[2023-09-14 12:54:01,940][109198] Environment var CUDA_VISIBLE_DEVICES is 0,1 + +[2023-09-14 12:54:03,931][109198] Starting experiment with the following configuration: +help=False +algo=APPO +env=doom_duel +experiment=default_experiment +train_dir=/home/cogstack/Documents/optuna/environments/sample_factory/train_dir +restart_behavior=resume +device=gpu +seed=None +num_policies=2 +async_rl=True +serial_mode=False +batched_sampling=False +num_batches_to_accumulate=2 +worker_num_splits=2 +policy_workers_per_policy=1 +max_policy_lag=1000 +num_workers=8 +num_envs_per_worker=4 +batch_size=1024 +num_batches_per_epoch=1 +num_epochs=1 +rollout=32 +recurrence=32 +shuffle_minibatches=False +gamma=0.99 +reward_scale=1.0 +reward_clip=1000.0 +value_bootstrap=False +normalize_returns=True +exploration_loss_coeff=0.001 +value_loss_coeff=0.5 +kl_loss_coeff=0.0 +exploration_loss=symmetric_kl +gae_lambda=0.95 +ppo_clip_ratio=0.1 +ppo_clip_value=0.2 +with_vtrace=False +vtrace_rho=1.0 +vtrace_c=1.0 +optimizer=adam +adam_eps=1e-06 +adam_beta1=0.9 +adam_beta2=0.999 +max_grad_norm=4.0 +learning_rate=0.0001 +lr_schedule=constant +lr_schedule_kl_threshold=0.008 +lr_adaptive_min=1e-06 +lr_adaptive_max=0.01 +obs_subtract_mean=0.0 +obs_scale=255.0 +normalize_input=True +normalize_input_keys=None +decorrelate_experience_max_seconds=0 +decorrelate_envs_on_one_worker=True +actor_worker_gpus=[] +set_workers_cpu_affinity=True +force_envs_single_thread=False +default_niceness=0 +log_to_file=True +experiment_summaries_interval=10 +flush_summaries_interval=30 +stats_avg=100 +summaries_use_frameskip=True +heartbeat_interval=20 +heartbeat_reporting_interval=600 +train_for_env_steps=10000000 +train_for_seconds=10000000000 +save_every_sec=120 +keep_checkpoints=2 +load_checkpoint_kind=latest +save_milestones_sec=-1 +save_best_every_sec=5 +save_best_metric=reward +save_best_after=100000 +benchmark=False +encoder_mlp_layers=[512, 512] +encoder_conv_architecture=convnet_simple +encoder_conv_mlp_layers=[512] +use_rnn=True +rnn_size=512 +rnn_type=gru +rnn_num_layers=1 +decoder_mlp_layers=[] +nonlinearity=elu +policy_initialization=orthogonal +policy_init_gain=1.0 +actor_critic_share_weights=True +adaptive_stddev=True +continuous_tanh_scale=0.0 +initial_stddev=1.0 +use_env_info_cache=False +env_gpu_actions=False +env_gpu_observations=True +env_frameskip=4 +env_framestack=1 +pixel_format=CHW +use_record_episode_statistics=False +with_wandb=False +wandb_user=None +wandb_project=sample_factory +wandb_group=None +wandb_job_type=SF +wandb_tags=[] +with_pbt=False +pbt_mix_policies_in_one_env=True +pbt_period_env_steps=5000000 +pbt_start_mutation=20000000 +pbt_replace_fraction=0.3 +pbt_mutation_rate=0.15 +pbt_replace_reward_gap=0.1 +pbt_replace_reward_gap_absolute=1e-06 +pbt_optimize_gamma=False +pbt_target_objective=true_objective +pbt_perturb_min=1.1 +pbt_perturb_max=1.5 +num_agents=-1 +num_humans=0 +num_bots=-1 +start_bot_difficulty=None +timelimit=None +res_w=128 +res_h=72 +wide_aspect_ratio=False +eval_env_frameskip=1 +fps=35 +command_line=--env=doom_dm --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=20000000 +cli_args={'env': 'doom_dm', 'num_workers': 8, 'num_envs_per_worker': 4, 'train_for_env_steps': 20000000} +git_hash=20b6d44612dad7d171f23e13b1f3b4c5e5631cf9 +git_repo_name=https://github.com/MattStammers/optuna.git +[2023-09-14 12:54:03,933][109198] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json... diff --git a/environments/sample_factory/wandb/latest-run b/environments/sample_factory/wandb/latest-run index 569faa1..64d5c62 120000 --- a/environments/sample_factory/wandb/latest-run +++ b/environments/sample_factory/wandb/latest-run @@ -1 +1 @@ -run-20230912_182125-default_experiment_20230912_165919_228624 \ No newline at end of file +run-20230914_125345-gopc2vgu \ No newline at end of file diff --git a/environments/unity/ml-agents b/environments/unity/ml-agents --- a/environments/unity/ml-agents +++ b/environments/unity/ml-agents @@ -1 +1 @@ -Subproject commit 8bcedabd808ffb7097f88b800fc92dea82dfd610 +Subproject commit 8bcedabd808ffb7097f88b800fc92dea82dfd610-dirty