diff --git a/environments/ai_vs_ai/ml-agents b/environments/ai_vs_ai/ml-agents --- a/environments/ai_vs_ai/ml-agents +++ b/environments/ai_vs_ai/ml-agents @@ -1 +1 @@ -Subproject commit 8bcedabd808ffb7097f88b800fc92dea82dfd610 +Subproject commit 8bcedabd808ffb7097f88b800fc92dea82dfd610-dirty diff --git a/environments/atari/model/qrdqn/QbertNoFrameskip-v4_6/0.monitor.csv b/environments/atari/model/qrdqn/QbertNoFrameskip-v4_6/0.monitor.csv index fb7057b..022e9b0 100644 --- a/environments/atari/model/qrdqn/QbertNoFrameskip-v4_6/0.monitor.csv +++ b/environments/atari/model/qrdqn/QbertNoFrameskip-v4_6/0.monitor.csv @@ -32220,3 +32220,7 @@ r,l,t 23050.0,10155,310929.782787 26000.0,11454,310943.878619 26325.0,12759,310959.764965 +15300.0,6347,310967.628622 +22950.0,11642,311015.595944 +15500.0,6612,311023.793262 +23025.0,10637,311037.115804 diff --git a/environments/atari/model/qrdqn/QbertNoFrameskip-v4_6/evaluations.npz b/environments/atari/model/qrdqn/QbertNoFrameskip-v4_6/evaluations.npz index 19b694c..3fe84a2 100644 Binary files a/environments/atari/model/qrdqn/QbertNoFrameskip-v4_6/evaluations.npz and b/environments/atari/model/qrdqn/QbertNoFrameskip-v4_6/evaluations.npz differ diff --git a/environments/sample_factory/doom_deathmatch.ipynb b/environments/sample_factory/doom_deathmatch.ipynb index 89dfc80..06e6f1a 100644 --- a/environments/sample_factory/doom_deathmatch.ipynb +++ b/environments/sample_factory/doom_deathmatch.ipynb @@ -11,21 +11,231 @@ }, { "cell_type": "code", - "execution_count": 1, + "execution_count": 11, "metadata": {}, "outputs": [], "source": [ - "import wandb\n", - "api = wandb.Api()\n", + "import wandb\n" + ] + }, + { + "cell_type": "code", + "execution_count": 35, + "metadata": {}, + "outputs": [ + { + "data": { + "text/html": [ + "Finishing last run (ID:cpaq4x6a) before initializing another..." + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "Waiting for W&B process to finish... (success)." + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "name": "stderr", + "output_type": "stream", + "text": [ + "wandb: WARNING Source type is set to 'repo' but some required information is missing from the environment. A job will not be created from this run. See https://docs.wandb.ai/guides/launch/create-job\n" + ] + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "c06e9e1e1e7b4e11aea23ac038b5113c", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "VBox(children=(Label(value='0.005 MB of 0.007 MB uploaded (0.000 MB deduped)\\r'), FloatProgress(value=0.612147…" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + " View run neat-sound-1 at: https://wandb.ai/matt-stammers/Doom_DeathMatch/runs/cpaq4x6a
Synced 4 W&B file(s), 0 media file(s), 0 artifact file(s) and 0 other file(s)" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "Find logs at: ./wandb/run-20230914_143444-cpaq4x6a/logs" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "Successfully finished last run (ID:cpaq4x6a). Initializing new run:
" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "b1e83eca47fd4cc396bfa54f88e76d3e", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "VBox(children=(Label(value='Waiting for wandb.init()...\\r'), FloatProgress(value=0.011120171700086858, max=1.0…" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "Tracking run with wandb version 0.15.10" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "Run data is saved locally in /home/cogstack/Documents/optuna/environments/sample_factory/wandb/run-20230914_143511-qiyz0kuy" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "Syncing run leafy-armadillo-2 to Weights & Biases (docs)
" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + " View project at https://wandb.ai/matt-stammers/Doom_DeathMatch" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + " View run at https://wandb.ai/matt-stammers/Doom_DeathMatch/runs/qiyz0kuy" + ], + "text/plain": [ + "" + ] + }, + "metadata": {}, + "output_type": "display_data" + }, + { + "data": { + "text/html": [ + "" + ], + "text/plain": [ + "" + ] + }, + "execution_count": 35, + "metadata": {}, + "output_type": "execute_result" + } + ], + "source": [ + "wandb.init(project=\"Doom_DeathMatch\")" + ] + }, + { + "cell_type": "code", + "execution_count": 23, + "metadata": {}, + "outputs": [ + { + "ename": "CommError", + "evalue": "Could not find run ", + "output_type": "error", + "traceback": [ + "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", + "\u001b[0;31mValueError\u001b[0m Traceback (most recent call last)", + "File \u001b[0;32m~/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/wandb/apis/normalize.py:41\u001b[0m, in \u001b[0;36mnormalize_exceptions..wrapper\u001b[0;34m(*args, **kwargs)\u001b[0m\n\u001b[1;32m 40\u001b[0m \u001b[39mtry\u001b[39;00m:\n\u001b[0;32m---> 41\u001b[0m \u001b[39mreturn\u001b[39;00m func(\u001b[39m*\u001b[39;49margs, \u001b[39m*\u001b[39;49m\u001b[39m*\u001b[39;49mkwargs)\n\u001b[1;32m 42\u001b[0m \u001b[39mexcept\u001b[39;00m requests\u001b[39m.\u001b[39mHTTPError \u001b[39mas\u001b[39;00m error:\n", + "File \u001b[0;32m~/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/wandb/apis/public.py:945\u001b[0m, in \u001b[0;36mApi.run\u001b[0;34m(self, path)\u001b[0m\n\u001b[1;32m 944\u001b[0m \u001b[39mif\u001b[39;00m \u001b[39mnot\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_runs\u001b[39m.\u001b[39mget(path):\n\u001b[0;32m--> 945\u001b[0m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_runs[path] \u001b[39m=\u001b[39m Run(\u001b[39mself\u001b[39;49m\u001b[39m.\u001b[39;49mclient, entity, project, run_id)\n\u001b[1;32m 946\u001b[0m \u001b[39mreturn\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_runs[path]\n", + "File \u001b[0;32m~/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/wandb/apis/public.py:1876\u001b[0m, in \u001b[0;36mRun.__init__\u001b[0;34m(self, client, entity, project, run_id, attrs, include_sweeps)\u001b[0m\n\u001b[1;32m 1874\u001b[0m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_state \u001b[39m=\u001b[39m _attrs\u001b[39m.\u001b[39mget(\u001b[39m\"\u001b[39m\u001b[39mstate\u001b[39m\u001b[39m\"\u001b[39m, \u001b[39m\"\u001b[39m\u001b[39mnot found\u001b[39m\u001b[39m\"\u001b[39m)\n\u001b[0;32m-> 1876\u001b[0m \u001b[39mself\u001b[39;49m\u001b[39m.\u001b[39;49mload(force\u001b[39m=\u001b[39;49m\u001b[39mnot\u001b[39;49;00m _attrs)\n", + "File \u001b[0;32m~/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/wandb/apis/public.py:1980\u001b[0m, in \u001b[0;36mRun.load\u001b[0;34m(self, force)\u001b[0m\n\u001b[1;32m 1975\u001b[0m \u001b[39mif\u001b[39;00m (\n\u001b[1;32m 1976\u001b[0m response \u001b[39mis\u001b[39;00m \u001b[39mNone\u001b[39;00m\n\u001b[1;32m 1977\u001b[0m \u001b[39mor\u001b[39;00m response\u001b[39m.\u001b[39mget(\u001b[39m\"\u001b[39m\u001b[39mproject\u001b[39m\u001b[39m\"\u001b[39m) \u001b[39mis\u001b[39;00m \u001b[39mNone\u001b[39;00m\n\u001b[1;32m 1978\u001b[0m \u001b[39mor\u001b[39;00m response[\u001b[39m\"\u001b[39m\u001b[39mproject\u001b[39m\u001b[39m\"\u001b[39m]\u001b[39m.\u001b[39mget(\u001b[39m\"\u001b[39m\u001b[39mrun\u001b[39m\u001b[39m\"\u001b[39m) \u001b[39mis\u001b[39;00m \u001b[39mNone\u001b[39;00m\n\u001b[1;32m 1979\u001b[0m ):\n\u001b[0;32m-> 1980\u001b[0m \u001b[39mraise\u001b[39;00m \u001b[39mValueError\u001b[39;00m(\u001b[39m\"\u001b[39m\u001b[39mCould not find run \u001b[39m\u001b[39m%s\u001b[39;00m\u001b[39m\"\u001b[39m \u001b[39m%\u001b[39m \u001b[39mself\u001b[39m)\n\u001b[1;32m 1981\u001b[0m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_attrs \u001b[39m=\u001b[39m response[\u001b[39m\"\u001b[39m\u001b[39mproject\u001b[39m\u001b[39m\"\u001b[39m][\u001b[39m\"\u001b[39m\u001b[39mrun\u001b[39m\u001b[39m\"\u001b[39m]\n", + "\u001b[0;31mValueError\u001b[0m: Could not find run ", + "\nDuring handling of the above exception, another exception occurred:\n", + "\u001b[0;31mCommError\u001b[0m Traceback (most recent call last)", + "\u001b[1;32m/home/cogstack/Documents/optuna/environments/sample_factory/doom_deathmatch.ipynb Cell 4\u001b[0m line \u001b[0;36m3\n\u001b[1;32m 1\u001b[0m api \u001b[39m=\u001b[39m wandb\u001b[39m.\u001b[39mApi()\n\u001b[0;32m----> 3\u001b[0m run \u001b[39m=\u001b[39m api\u001b[39m.\u001b[39;49mrun(\u001b[39m\"\u001b[39;49m\u001b[39mmatt-stammers/Doom_Duel/ethereal-star-2\u001b[39;49m\u001b[39m\"\u001b[39;49m)\n\u001b[1;32m 4\u001b[0m run\u001b[39m.\u001b[39mconfig[\u001b[39m\"\u001b[39m\u001b[39mkey\u001b[39m\u001b[39m\"\u001b[39m] \u001b[39m=\u001b[39m \u001b[39m\"\u001b[39m\u001b[39mworking_start\u001b[39m\u001b[39m\"\u001b[39m\n\u001b[1;32m 5\u001b[0m run\u001b[39m.\u001b[39mupdate()\n", + "File \u001b[0;32m~/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/wandb/apis/normalize.py:87\u001b[0m, in \u001b[0;36mnormalize_exceptions..wrapper\u001b[0;34m(*args, **kwargs)\u001b[0m\n\u001b[1;32m 85\u001b[0m \u001b[39mraise\u001b[39;00m\n\u001b[1;32m 86\u001b[0m \u001b[39melse\u001b[39;00m:\n\u001b[0;32m---> 87\u001b[0m \u001b[39mraise\u001b[39;00m CommError(message, err)\u001b[39m.\u001b[39mwith_traceback(sys\u001b[39m.\u001b[39mexc_info()[\u001b[39m2\u001b[39m])\n", + "File \u001b[0;32m~/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/wandb/apis/normalize.py:41\u001b[0m, in \u001b[0;36mnormalize_exceptions..wrapper\u001b[0;34m(*args, **kwargs)\u001b[0m\n\u001b[1;32m 39\u001b[0m message \u001b[39m=\u001b[39m \u001b[39m\"\u001b[39m\u001b[39mWhoa, you found a bug.\u001b[39m\u001b[39m\"\u001b[39m\n\u001b[1;32m 40\u001b[0m \u001b[39mtry\u001b[39;00m:\n\u001b[0;32m---> 41\u001b[0m \u001b[39mreturn\u001b[39;00m func(\u001b[39m*\u001b[39;49margs, \u001b[39m*\u001b[39;49m\u001b[39m*\u001b[39;49mkwargs)\n\u001b[1;32m 42\u001b[0m \u001b[39mexcept\u001b[39;00m requests\u001b[39m.\u001b[39mHTTPError \u001b[39mas\u001b[39;00m error:\n\u001b[1;32m 43\u001b[0m errors \u001b[39m=\u001b[39m parse_backend_error_messages(error\u001b[39m.\u001b[39mresponse)\n", + "File \u001b[0;32m~/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/wandb/apis/public.py:945\u001b[0m, in \u001b[0;36mApi.run\u001b[0;34m(self, path)\u001b[0m\n\u001b[1;32m 943\u001b[0m entity, project, run_id \u001b[39m=\u001b[39m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_parse_path(path)\n\u001b[1;32m 944\u001b[0m \u001b[39mif\u001b[39;00m \u001b[39mnot\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_runs\u001b[39m.\u001b[39mget(path):\n\u001b[0;32m--> 945\u001b[0m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_runs[path] \u001b[39m=\u001b[39m Run(\u001b[39mself\u001b[39;49m\u001b[39m.\u001b[39;49mclient, entity, project, run_id)\n\u001b[1;32m 946\u001b[0m \u001b[39mreturn\u001b[39;00m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_runs[path]\n", + "File \u001b[0;32m~/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/wandb/apis/public.py:1876\u001b[0m, in \u001b[0;36mRun.__init__\u001b[0;34m(self, client, entity, project, run_id, attrs, include_sweeps)\u001b[0m\n\u001b[1;32m 1873\u001b[0m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_metadata: Optional[Dict[\u001b[39mstr\u001b[39m, Any]] \u001b[39m=\u001b[39m \u001b[39mNone\u001b[39;00m\n\u001b[1;32m 1874\u001b[0m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_state \u001b[39m=\u001b[39m _attrs\u001b[39m.\u001b[39mget(\u001b[39m\"\u001b[39m\u001b[39mstate\u001b[39m\u001b[39m\"\u001b[39m, \u001b[39m\"\u001b[39m\u001b[39mnot found\u001b[39m\u001b[39m\"\u001b[39m)\n\u001b[0;32m-> 1876\u001b[0m \u001b[39mself\u001b[39;49m\u001b[39m.\u001b[39;49mload(force\u001b[39m=\u001b[39;49m\u001b[39mnot\u001b[39;49;00m _attrs)\n", + "File \u001b[0;32m~/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/wandb/apis/public.py:1980\u001b[0m, in \u001b[0;36mRun.load\u001b[0;34m(self, force)\u001b[0m\n\u001b[1;32m 1974\u001b[0m response \u001b[39m=\u001b[39m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_exec(query)\n\u001b[1;32m 1975\u001b[0m \u001b[39mif\u001b[39;00m (\n\u001b[1;32m 1976\u001b[0m response \u001b[39mis\u001b[39;00m \u001b[39mNone\u001b[39;00m\n\u001b[1;32m 1977\u001b[0m \u001b[39mor\u001b[39;00m response\u001b[39m.\u001b[39mget(\u001b[39m\"\u001b[39m\u001b[39mproject\u001b[39m\u001b[39m\"\u001b[39m) \u001b[39mis\u001b[39;00m \u001b[39mNone\u001b[39;00m\n\u001b[1;32m 1978\u001b[0m \u001b[39mor\u001b[39;00m response[\u001b[39m\"\u001b[39m\u001b[39mproject\u001b[39m\u001b[39m\"\u001b[39m]\u001b[39m.\u001b[39mget(\u001b[39m\"\u001b[39m\u001b[39mrun\u001b[39m\u001b[39m\"\u001b[39m) \u001b[39mis\u001b[39;00m \u001b[39mNone\u001b[39;00m\n\u001b[1;32m 1979\u001b[0m ):\n\u001b[0;32m-> 1980\u001b[0m \u001b[39mraise\u001b[39;00m \u001b[39mValueError\u001b[39;00m(\u001b[39m\"\u001b[39m\u001b[39mCould not find run \u001b[39m\u001b[39m%s\u001b[39;00m\u001b[39m\"\u001b[39m \u001b[39m%\u001b[39m \u001b[39mself\u001b[39m)\n\u001b[1;32m 1981\u001b[0m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_attrs \u001b[39m=\u001b[39m response[\u001b[39m\"\u001b[39m\u001b[39mproject\u001b[39m\u001b[39m\"\u001b[39m][\u001b[39m\"\u001b[39m\u001b[39mrun\u001b[39m\u001b[39m\"\u001b[39m]\n\u001b[1;32m 1982\u001b[0m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_state \u001b[39m=\u001b[39m \u001b[39mself\u001b[39m\u001b[39m.\u001b[39m_attrs[\u001b[39m\"\u001b[39m\u001b[39mstate\u001b[39m\u001b[39m\"\u001b[39m]\n", + "\u001b[0;31mCommError\u001b[0m: Could not find run " + ] + } + ], + "source": [ + "# api = wandb.Api()\n", "\n", - "run = api.run(\"matt-stammers/sample_factory/default_experiment_20230912_141858_570479\")\n", - "run.config[\"key\"] = \"default_experiment_deathmatch\"\n", - "run.update()" + "# run = api.run(\"matt-stammers/Doom_Duel/ethereal-star-2\")\n", + "# run.config[\"key\"] = \"working_start\"\n", + "# run.update()" ] }, { "cell_type": "code", - "execution_count": 2, + "execution_count": 15, "metadata": {}, "outputs": [], "source": [ @@ -73,60 +283,63 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 37, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ - "\u001b[33m[2023-09-12 21:01:43,594][28625] Environment doom_basic already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,596][28625] Environment doom_two_colors_easy already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,599][28625] Environment doom_two_colors_hard already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,601][28625] Environment doom_dm already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,603][28625] Environment doom_dwango5 already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,604][28625] Environment doom_my_way_home_flat_actions already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,605][28625] Environment doom_defend_the_center_flat_actions already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,606][28625] Environment doom_my_way_home already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,607][28625] Environment doom_deadly_corridor already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,608][28625] Environment doom_defend_the_center already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,610][28625] Environment doom_defend_the_line already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,611][28625] Environment doom_health_gathering already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,613][28625] Environment doom_health_gathering_supreme already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,613][28625] Environment doom_battle already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,614][28625] Environment doom_battle2 already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,614][28625] Environment doom_duel_bots already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,615][28625] Environment doom_deathmatch_bots already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,616][28625] Environment doom_duel already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,616][28625] Environment doom_deathmatch_full already registered, overwriting...\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,617][28625] Environment doom_benchmark already registered, overwriting...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:43,617][28625] register_encoder_factory: \u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:43,646][28625] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:43,650][28625] Overriding arg 'train_for_env_steps' with value 1000000 passed from command line\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:43,659][28625] Experiment dir /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment already exists!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:43,661][28625] Resuming existing experiment from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:43,661][28625] Weights and Biases integration disabled\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:43,664][28625] Environment var CUDA_VISIBLE_DEVICES is 0,1\n", + "\u001b[33m[2023-09-14 14:36:27,406][109198] Environment doom_basic already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,407][109198] Environment doom_two_colors_easy already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,409][109198] Environment doom_two_colors_hard already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,410][109198] Environment doom_dm already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,414][109198] Environment doom_dwango5 already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,415][109198] Environment doom_my_way_home_flat_actions already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,415][109198] Environment doom_defend_the_center_flat_actions already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,416][109198] Environment doom_my_way_home already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,417][109198] Environment doom_deadly_corridor already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,417][109198] Environment doom_defend_the_center already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,418][109198] Environment doom_defend_the_line already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,418][109198] Environment doom_health_gathering already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,419][109198] Environment doom_health_gathering_supreme already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,420][109198] Environment doom_battle already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,421][109198] Environment doom_battle2 already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,422][109198] Environment doom_duel_bots already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,423][109198] Environment doom_deathmatch_bots already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,424][109198] Environment doom_duel already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,425][109198] Environment doom_deathmatch_full already registered, overwriting...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,425][109198] Environment doom_benchmark already registered, overwriting...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:27,426][109198] register_encoder_factory: \u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:27,445][109198] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:27,450][109198] Experiment dir /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment already exists!\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:27,451][109198] Moving the existing experiment dir to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment_old0014...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:27,452][109198] Starting training in /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:27,453][109198] Weights and Biases integration disabled\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:27,458][109198] Environment var CUDA_VISIBLE_DEVICES is 0,1\n", "\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:45,348][39338] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:45,376][39338] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:29,146][63242] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:29,148][63242] Port 40300 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:29,148][63242] Using port 40300\u001b[0m\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.num_agents to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.num_agents` for environment variables or `env.get_wrapper_attr('num_agents')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.is_multiagent to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.is_multiagent` for environment variables or `env.get_wrapper_attr('is_multiagent')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", - "\u001b[36m[2023-09-12 21:01:45,378][39338] Env info: EnvInfo(obs_space=Dict('measurements': Box([ 0. 0. -1. -1. -50. 0. 0. 0. 0. 0. 0. 0. 0. 0.\n", + "\u001b[36m[2023-09-14 14:36:29,149][63242] Env info: EnvInfo(obs_space=Dict('measurements': Box([ 0. 0. -1. -1. -50. 0. 0. 0. 0. 0. 0. 0. 0. 0.\n", " 0. 0. 0. 0. 0. 0. 0. 0. 0.], [20. 50. 50. 50. 50. 1. 10. 5. 5. 5. 5. 5. 5. 5. 5. 50. 50. 50.\n", - " 50. 50. 50. 50. 50.], (23,), float32), 'obs': Box(0, 255, (3, 72, 128), uint8)), action_space=Tuple(Discrete(3), Discrete(3), Discrete(3), Discrete(2), Discrete(2), Box(-1.0, 1.0, (1,), float32)), num_agents=8, gpu_actions=False, gpu_observations=True, action_splits=[1, 1, 1, 1, 1, 1], all_discrete=False, frameskip=4, reward_shaping_scheme={'delta': {'FRAGCOUNT': (1, -0.001), 'DEATHCOUNT': (-1, 1), 'HITCOUNT': (0, 0), 'DAMAGECOUNT': (0.01, -0.01), 'HEALTH': (0.01, -0.01), 'ARMOR': (0.005, -0.001), 'WEAPON0': (0.02, -0.01), 'AMMO0': (0.0002, -0.0001), 'WEAPON1': (0.02, -0.01), 'AMMO1': (0.0002, -0.0001), 'WEAPON2': (0.02, -0.01), 'AMMO2': (0.0002, -0.0001), 'WEAPON3': (0.1, -0.05), 'AMMO3': (0.001, -0.0005), 'WEAPON4': (0.1, -0.05), 'AMMO4': (0.001, -0.0005), 'WEAPON5': (0.1, -0.05), 'AMMO5': (0.001, -0.0005), 'WEAPON6': (0.2, -0.1), 'AMMO6': (0.002, -0.001), 'WEAPON7': (0.2, -0.1), 'AMMO7': (0.002, -0.001)}, 'selected_weapon': {'SELECTED0': 0.0002, 'SELECTED1': 0.0002, 'SELECTED2': 0.0002, 'SELECTED3': 0.001, 'SELECTED4': 0.001, 'SELECTED5': 0.001, 'SELECTED6': 0.002, 'SELECTED7': 0.002}}, env_info_protocol_version=1)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:45,745][28625] Starting experiment with the following configuration:\n", + " 50. 50. 50. 50. 50.], (23,), float32), 'obs': Box(0, 255, (3, 72, 128), uint8)), action_space=Tuple(Discrete(3), Discrete(3), Discrete(8), Discrete(2), Discrete(2), Discrete(21)), num_agents=1, gpu_actions=False, gpu_observations=True, action_splits=[1, 1, 1, 1, 1, 1], all_discrete=True, frameskip=4, reward_shaping_scheme={'delta': {'FRAGCOUNT': (1, -1.5), 'DEATHCOUNT': (-0.75, 0.75), 'HITCOUNT': (0.01, -0.01), 'DAMAGECOUNT': (0.003, -0.003), 'HEALTH': (0.005, -0.003), 'ARMOR': (0.005, -0.001), 'WEAPON0': (0.02, -0.01), 'AMMO0': (0.0002, -0.0001), 'WEAPON1': (0.02, -0.01), 'AMMO1': (0.0002, -0.0001), 'WEAPON2': (0.02, -0.01), 'AMMO2': (0.0002, -0.0001), 'WEAPON3': (0.1, -0.05), 'AMMO3': (0.001, -0.0005), 'WEAPON4': (0.1, -0.05), 'AMMO4': (0.001, -0.0005), 'WEAPON5': (0.1, -0.05), 'AMMO5': (0.001, -0.0005), 'WEAPON6': (0.2, -0.1), 'AMMO6': (0.002, -0.001), 'WEAPON7': (0.2, -0.1), 'AMMO7': (0.002, -0.001)}, 'selected_weapon': {'SELECTED0': 0.0002, 'SELECTED1': 0.0002, 'SELECTED2': 0.0002, 'SELECTED3': 0.001, 'SELECTED4': 0.001, 'SELECTED5': 0.001, 'SELECTED6': 0.002, 'SELECTED7': 0.002}}, env_info_protocol_version=1)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:29,541][109198] Starting experiment with the following configuration:\n", "help=False\n", "algo=APPO\n", - "env=doom_dwango5\n", + "env=doom_deathmatch_bots\n", "experiment=default_experiment\n", "train_dir=/home/cogstack/Documents/optuna/environments/sample_factory/train_dir\n", - "restart_behavior=resume\n", + "restart_behavior=restart\n", "device=gpu\n", "seed=None\n", - "num_policies=1\n", + "num_policies=2\n", "async_rl=True\n", "serial_mode=False\n", "batched_sampling=False\n", @@ -184,7 +397,7 @@ "summaries_use_frameskip=True\n", "heartbeat_interval=20\n", "heartbeat_reporting_interval=600\n", - "train_for_env_steps=1000000\n", + "train_for_env_steps=10000000\n", "train_for_seconds=10000000000\n", "save_every_sec=120\n", "keep_checkpoints=2\n", @@ -248,44 +461,116 @@ "cli_args={'env': 'doom_dm', 'num_workers': 8, 'num_envs_per_worker': 4, 'train_for_env_steps': 20000000}\n", "git_hash=20b6d44612dad7d171f23e13b1f3b4c5e5631cf9\n", "git_repo_name=https://github.com/MattStammers/optuna.git\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:45,747][28625] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,757][28625] Rollout worker 0 uses device cpu\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,758][28625] Rollout worker 1 uses device cpu\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,760][28625] Rollout worker 2 uses device cpu\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,761][28625] Rollout worker 3 uses device cpu\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,763][28625] Rollout worker 4 uses device cpu\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,765][28625] Rollout worker 5 uses device cpu\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,767][28625] Rollout worker 6 uses device cpu\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,768][28625] Rollout worker 7 uses device cpu\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,937][28625] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:46,939][28625] InferenceWorker_p0-w0: min num requests: 2\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,973][28625] Starting all processes...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:46,974][28625] Starting process learner_proc0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,713][28625] Starting all processes...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:48,713][39537] LearnerWorker_p0\tpid 39537\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,714][39537] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:48,714][39537] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,719][28625] Starting process inference_proc0-0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,719][28625] Starting process rollout_proc0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,720][28625] Starting process rollout_proc1\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,720][28625] Starting process rollout_proc2\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,725][28625] Starting process rollout_proc3\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,725][28625] Starting process rollout_proc4\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,725][28625] Starting process rollout_proc5\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,759][39537] Num visible devices: 1\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,726][28625] Starting process rollout_proc6\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,726][28625] Starting process rollout_proc7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:48,796][39537] Starting seed is not provided\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,797][39537] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,797][39537] Initializing actor-critic model on device cuda:0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,797][39537] RunningMeanStd input shape: (23,)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,798][39537] RunningMeanStd input shape: (3, 72, 128)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,798][39537] RunningMeanStd input shape: (1,)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,810][39537] ConvEncoder: input_channels=3\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,954][39537] Conv encoder output size: 512\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,956][39537] Policy head output size: 640\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,984][39537] Created Actor Critic model with architecture:\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:48,986][39537] ActorCriticSharedWeights(\n", + "\u001b[36m[2023-09-14 14:36:29,543][109198] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:29,664][109198] Rollout worker 0 uses device cpu\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:29,666][109198] Rollout worker 1 uses device cpu\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:29,668][109198] Rollout worker 2 uses device cpu\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:29,669][109198] Rollout worker 3 uses device cpu\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:29,671][109198] Rollout worker 4 uses device cpu\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:29,673][109198] Rollout worker 5 uses device cpu\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:29,674][109198] Rollout worker 6 uses device cpu\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:29,676][109198] Rollout worker 7 uses device cpu\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:29,741][109198] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:29,742][109198] InferenceWorker_p0-w0: min num requests: 1\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:29,746][109198] Using GPUs [1] for process 1 (actually maps to GPUs [1])\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:29,747][109198] InferenceWorker_p1-w0: min num requests: 1\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:29,774][109198] Starting all processes...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:29,776][109198] Starting process learner_proc0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:31,457][109198] Starting process learner_proc1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:31,458][63454] LearnerWorker_p0\tpid 63454\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:31,459][63454] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:31,459][63454] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:31,477][63454] Num visible devices: 1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:31,496][63454] Starting seed is not provided\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:31,496][63454] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:31,497][63454] Initializing actor-critic model on device cuda:0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:31,497][63454] RunningMeanStd input shape: (23,)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:31,497][63454] RunningMeanStd input shape: (3, 72, 128)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:31,498][63454] RunningMeanStd input shape: (1,)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:31,509][63454] ConvEncoder: input_channels=3\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:31,620][63454] Conv encoder output size: 512\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:31,622][63454] Policy head output size: 640\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:31,639][63454] Created Actor Critic model with architecture:\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:31,639][63454] ActorCriticSharedWeights(\n", + " (obs_normalizer): ObservationNormalizer(\n", + " (running_mean_std): RunningMeanStdDictInPlace(\n", + " (running_mean_std): ModuleDict(\n", + " (measurements): RunningMeanStdInPlace()\n", + " (obs): RunningMeanStdInPlace()\n", + " )\n", + " )\n", + " )\n", + " (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace)\n", + " (encoder): VizdoomEncoder(\n", + " (basic_encoder): ConvEncoder(\n", + " (enc): RecursiveScriptModule(\n", + " original_name=ConvEncoderImpl\n", + " (conv_head): RecursiveScriptModule(\n", + " original_name=Sequential\n", + " (0): RecursiveScriptModule(original_name=Conv2d)\n", + " (1): RecursiveScriptModule(original_name=ELU)\n", + " (2): RecursiveScriptModule(original_name=Conv2d)\n", + " (3): RecursiveScriptModule(original_name=ELU)\n", + " (4): RecursiveScriptModule(original_name=Conv2d)\n", + " (5): RecursiveScriptModule(original_name=ELU)\n", + " )\n", + " (mlp_layers): RecursiveScriptModule(\n", + " original_name=Sequential\n", + " (0): RecursiveScriptModule(original_name=Linear)\n", + " (1): RecursiveScriptModule(original_name=ELU)\n", + " )\n", + " )\n", + " )\n", + " (measurements_head): Sequential(\n", + " (0): Linear(in_features=23, out_features=128, bias=True)\n", + " (1): ELU(alpha=1.0)\n", + " (2): Linear(in_features=128, out_features=128, bias=True)\n", + " (3): ELU(alpha=1.0)\n", + " )\n", + " )\n", + " (core): ModelCoreRNN(\n", + " (core): GRU(640, 512)\n", + " )\n", + " (decoder): MlpDecoder(\n", + " (mlp): Identity()\n", + " )\n", + " (critic_linear): Linear(in_features=512, out_features=1, bias=True)\n", + " (action_parameterization): ActionParameterizationDefault(\n", + " (distribution_linear): Linear(in_features=512, out_features=39, bias=True)\n", + " )\n", + ")\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:32,540][63454] Using optimizer \u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:32,541][63454] No checkpoints found\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:32,541][63454] Did not load from checkpoint, starting from scratch!\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:32,541][63454] Initialized policy 0 weights for model version 0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:32,543][63454] LearnerWorker_p0 finished initialization!\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:32,543][63454] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,025][109198] Starting all processes...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:33,025][63576] LearnerWorker_p1\tpid 63576\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,026][63576] Using GPUs [1] for process 1 (actually maps to GPUs [1])\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:33,026][63576] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for learning process 1\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,032][109198] Starting process inference_proc0-0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,034][109198] Starting process inference_proc1-0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,034][109198] Starting process rollout_proc0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,035][109198] Starting process rollout_proc1\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,035][109198] Starting process rollout_proc2\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,035][109198] Starting process rollout_proc3\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,064][63576] Num visible devices: 1\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,036][109198] Starting process rollout_proc4\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,037][109198] Starting process rollout_proc5\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,038][109198] Starting process rollout_proc6\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,038][109198] Starting process rollout_proc7\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:33,107][63576] Starting seed is not provided\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,108][63576] Using GPUs [0] for process 1 (actually maps to GPUs [1])\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,108][63576] Initializing actor-critic model on device cuda:0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,108][63576] RunningMeanStd input shape: (23,)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,109][63576] RunningMeanStd input shape: (3, 72, 128)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,109][63576] RunningMeanStd input shape: (1,)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,130][63576] ConvEncoder: input_channels=3\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,386][63576] Conv encoder output size: 512\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,387][63576] Policy head output size: 640\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,417][63576] Created Actor Critic model with architecture:\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:33,418][63576] ActorCriticSharedWeights(\n", " (obs_normalizer): ObservationNormalizer(\n", " (running_mean_std): RunningMeanStdDictInPlace(\n", " (running_mean_std): ModuleDict(\n", @@ -330,6747 +615,6805 @@ " )\n", " (critic_linear): Linear(in_features=512, out_features=1, bias=True)\n", " (action_parameterization): ActionParameterizationDefault(\n", - " (distribution_linear): Linear(in_features=512, out_features=15, bias=True)\n", + " (distribution_linear): Linear(in_features=512, out_features=39, bias=True)\n", " )\n", ")\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,408][39537] Using optimizer \u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:50,409][39537] No checkpoints found\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,409][39537] Did not load from checkpoint, starting from scratch!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,409][39537] Initialized policy 0 weights for model version 0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,412][39537] LearnerWorker_p0 finished initialization!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,412][39537] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,709][39685] Rollout worker 0 starting...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:50,709][39685] ROLLOUT worker 0\tpid 39685\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,710][39685] Worker 0 uses CPU cores [0, 1, 2, 3]\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,780][39698] Rollout worker 3 starting...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:50,780][39698] ROLLOUT worker 3\tpid 39698\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,780][39698] Worker 3 uses CPU cores [12, 13, 14, 15]\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,818][39731] Rollout worker 4 starting...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:50,818][39731] ROLLOUT worker 4\tpid 39731\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,819][39731] Worker 4 uses CPU cores [16, 17, 18, 19]\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,855][39734] Rollout worker 7 starting...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:50,855][39734] ROLLOUT worker 7\tpid 39734\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,857][39734] Worker 7 uses CPU cores [28, 29, 30, 31]\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,880][39699] Rollout worker 5 starting...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:50,880][39699] ROLLOUT worker 5\tpid 39699\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,881][39699] Worker 5 uses CPU cores [20, 21, 22, 23]\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:50,915][39686] InferenceWorker_p0-w0\tpid 39686\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,915][39686] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:50,915][39686] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,927][39696] Rollout worker 2 starting...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:50,927][39696] ROLLOUT worker 2\tpid 39696\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,931][39696] Worker 2 uses CPU cores [8, 9, 10, 11]\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,954][39686] Num visible devices: 1\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,991][39733] Rollout worker 6 starting...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:50,991][39733] ROLLOUT worker 6\tpid 39733\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:50,992][39733] Worker 6 uses CPU cores [24, 25, 26, 27]\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:51,090][39697] Rollout worker 1 starting...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:51,090][39697] ROLLOUT worker 1\tpid 39697\tparent 28625\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:51,090][39697] Worker 1 uses CPU cores [4, 5, 6, 7]\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:51,618][39686] RunningMeanStd input shape: (23,)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:51,618][39686] RunningMeanStd input shape: (3, 72, 128)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:51,618][39686] RunningMeanStd input shape: (1,)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:51,630][39686] ConvEncoder: input_channels=3\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:51,739][39686] Conv encoder output size: 512\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:51,740][39686] Policy head output size: 640\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,083][28625] Inference worker 0-0 is ready!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,085][28625] All inference workers are ready! Signal rollout workers to start!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,088][39685] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,090][39698] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,091][39734] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,092][39696] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,092][39699] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,092][39697] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,093][39731] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,094][39733] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,118][39685] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,121][39685] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,124][39734] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,125][39697] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,125][39699] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,126][39696] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,127][39731] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,128][39734] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,129][39697] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,129][39699] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,129][39696] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,130][39731] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,134][39698] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,139][39733] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,139][39698] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,143][39733] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,151][39685] Port 40300 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,151][39685] Using port 40300\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,152][39685] Initializing env for player 0, init_info: {'port': 40300}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,160][39697] Port 40400 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,160][39697] Using port 40400\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,161][39696] Port 40500 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,161][39699] Port 40800 is available\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,161][39697] Initializing env for player 0, init_info: {'port': 40400}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,161][39696] Using port 40500\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,161][39699] Using port 40800\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,161][39734] Port 41000 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,161][39734] Using port 41000\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,162][39696] Initializing env for player 0, init_info: {'port': 40500}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,162][39699] Initializing env for player 0, init_info: {'port': 40800}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,163][39734] Initializing env for player 0, init_info: {'port': 41000}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,176][39733] Port 40900 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,176][39733] Using port 40900\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,177][39733] Initializing env for player 0, init_info: {'port': 40900}...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:34,638][63576] Using optimizer \u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:34,639][63576] No checkpoints found\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:34,639][63576] Did not load from checkpoint, starting from scratch!\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:34,639][63576] Initialized policy 1 weights for model version 0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:34,641][63576] LearnerWorker_p1 finished initialization!\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:34,641][63576] Using GPUs [0] for process 1 (actually maps to GPUs [1])\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:34,966][63732] InferenceWorker_p0-w0\tpid 63732\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:34,966][63732] Using GPUs [0] for process 0 (actually maps to GPUs [0])\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:34,966][63732] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:34,984][63732] Num visible devices: 1\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,023][63734] Rollout worker 1 starting...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:35,023][63734] ROLLOUT worker 1\tpid 63734\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,027][63734] Worker 1 uses CPU cores [4, 5, 6, 7]\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,039][63806] Rollout worker 7 starting...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:35,039][63806] ROLLOUT worker 7\tpid 63806\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,040][63806] Worker 7 uses CPU cores [28, 29, 30, 31]\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,095][63770] Rollout worker 4 starting...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:35,095][63770] ROLLOUT worker 4\tpid 63770\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,099][63770] Worker 4 uses CPU cores [16, 17, 18, 19]\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,180][63769] Rollout worker 3 starting...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:35,180][63769] ROLLOUT worker 3\tpid 63769\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,180][63769] Worker 3 uses CPU cores [12, 13, 14, 15]\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,288][63771] Rollout worker 5 starting...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:35,288][63771] ROLLOUT worker 5\tpid 63771\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,289][63771] Worker 5 uses CPU cores [20, 21, 22, 23]\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,305][63767] Rollout worker 2 starting...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:35,305][63767] ROLLOUT worker 2\tpid 63767\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,305][63767] Worker 2 uses CPU cores [8, 9, 10, 11]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:35,342][63733] InferenceWorker_p1-w0\tpid 63733\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,343][63733] Using GPUs [1] for process 1 (actually maps to GPUs [1])\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:35,343][63733] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for inference process 1\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,362][63733] Num visible devices: 1\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,502][63805] Rollout worker 6 starting...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:35,502][63805] ROLLOUT worker 6\tpid 63805\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,504][63805] Worker 6 uses CPU cores [24, 25, 26, 27]\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,538][63735] Rollout worker 0 starting...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:35,538][63735] ROLLOUT worker 0\tpid 63735\tparent 109198\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,539][63735] Worker 0 uses CPU cores [0, 1, 2, 3]\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,629][63732] RunningMeanStd input shape: (23,)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,629][63732] RunningMeanStd input shape: (3, 72, 128)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,630][63732] RunningMeanStd input shape: (1,)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,642][63732] ConvEncoder: input_channels=3\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,747][63732] Conv encoder output size: 512\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:35,748][63732] Policy head output size: 640\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,012][63733] RunningMeanStd input shape: (23,)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,012][63733] RunningMeanStd input shape: (3, 72, 128)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,013][63733] RunningMeanStd input shape: (1,)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,024][63733] ConvEncoder: input_channels=3\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,029][109198] Inference worker 0-0 is ready!\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,126][63733] Conv encoder output size: 512\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,127][63733] Policy head output size: 640\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,405][109198] Inference worker 1-0 is ready!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,406][109198] All inference workers are ready! Signal rollout workers to start!\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,442][63735] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,444][63735] Port 40300 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,444][63735] Using port 40300\u001b[0m\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.num_agents to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.num_agents` for environment variables or `env.get_wrapper_attr('num_agents')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.is_multiagent to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.is_multiagent` for environment variables or `env.get_wrapper_attr('is_multiagent')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "\u001b[36m[2023-09-14 14:36:36,446][63734] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,447][63806] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,447][63769] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,447][63767] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,448][63805] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,448][63734] Port 40400 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,449][63734] Using port 40400\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:36,449][63806] UDP port 41000 cannot be used [Errno 98] Address already in use\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,449][63769] Port 40600 is available\u001b[0m\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "\u001b[36m[2023-09-14 14:36:36,449][63769] Using port 40600\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,449][63806] Port 42000 is available\u001b[0m\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.num_agents to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.num_agents` for environment variables or `env.get_wrapper_attr('num_agents')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "\u001b[36m[2023-09-14 14:36:36,449][63806] Using port 42000\u001b[0m\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.is_multiagent to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.is_multiagent` for environment variables or `env.get_wrapper_attr('is_multiagent')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,185][39685] Using port 40300 on host...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,186][39698] Port 40600 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,186][39698] Using port 40600\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,187][39698] Initializing env for player 0, init_info: {'port': 40600}...\u001b[0m\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,193][39734] Using port 41000 on host...\u001b[0m\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.num_agents to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.num_agents` for environment variables or `env.get_wrapper_attr('num_agents')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.is_multiagent to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.is_multiagent` for environment variables or `env.get_wrapper_attr('is_multiagent')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.num_agents to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.num_agents` for environment variables or `env.get_wrapper_attr('num_agents')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.is_multiagent to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.is_multiagent` for environment variables or `env.get_wrapper_attr('is_multiagent')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "\u001b[36m[2023-09-14 14:36:36,449][63767] Port 40500 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,450][63767] Using port 40500\u001b[0m\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,195][39696] Using port 40500 on host...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,197][39731] Port 40700 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:52,197][39731] Using port 40700\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,202][39685] Initializing env for player 1, init_info: {'port': 40300}...\u001b[0m\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.num_agents to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.num_agents` for environment variables or `env.get_wrapper_attr('num_agents')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.is_multiagent to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.is_multiagent` for environment variables or `env.get_wrapper_attr('is_multiagent')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "\u001b[36m[2023-09-14 14:36:36,451][63805] Port 40900 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,451][63805] Using port 40900\u001b[0m\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,207][39733] Using port 40900 on host...\u001b[0m\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.num_agents to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.num_agents` for environment variables or `env.get_wrapper_attr('num_agents')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.is_multiagent to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.is_multiagent` for environment variables or `env.get_wrapper_attr('is_multiagent')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "\u001b[36m[2023-09-14 14:36:36,452][63770] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,455][63770] Port 40700 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,456][63770] Using port 40700\u001b[0m\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,209][39697] Using port 40400 on host...\u001b[0m\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.num_agents to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.num_agents` for environment variables or `env.get_wrapper_attr('num_agents')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.is_multiagent to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.is_multiagent` for environment variables or `env.get_wrapper_attr('is_multiagent')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "\u001b[36m[2023-09-14 14:36:36,456][63771] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,459][63771] Port 40800 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,460][63771] Using port 40800\u001b[0m\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,210][39699] Using port 40800 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,212][39696] Initializing env for player 1, init_info: {'port': 40500}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,214][39734] Initializing env for player 1, init_info: {'port': 41000}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,217][39699] Initializing env for player 1, init_info: {'port': 40800}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,219][39697] Initializing env for player 1, init_info: {'port': 40400}...\u001b[0m\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.num_agents to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.num_agents` for environment variables or `env.get_wrapper_attr('num_agents')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.is_multiagent to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.is_multiagent` for environment variables or `env.get_wrapper_attr('is_multiagent')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "\u001b[36m[2023-09-14 14:36:36,474][63735] Port 40301 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,474][63735] Using port 40301\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,476][63735] Using port 40300 on host...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,479][63734] Port 40401 is available\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:36,479][63806] UDP port 41001 cannot be used [Errno 98] Address already in use\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,479][63734] Using port 40401\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,479][63806] Port 42001 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,479][63806] Using port 42001\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,480][63769] Port 40601 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,480][63769] Using port 40601\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,480][63734] Using port 40400 on host...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,481][63767] Port 40501 is available\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,481][63806] Using port 42000 on host...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,481][63767] Using port 40501\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,482][63769] Using port 40600 on host...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,482][63805] Port 40901 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,482][63805] Using port 40901\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,482][63767] Using port 40500 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,484][63805] Using port 40900 on host...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,486][63770] Port 40701 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,486][63770] Using port 40701\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,488][63770] Using port 40700 on host...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,506][63771] Port 40801 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:36,507][63771] Using port 40801\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,509][63771] Using port 40800 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,770][63806] Initialized w:7 v:0 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,772][63806] Decorrelating experience for 0 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,773][63806] Using port 42001 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,778][63769] Initialized w:3 v:0 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,778][63805] Initialized w:6 v:0 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,779][63767] Initialized w:2 v:0 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,780][63805] Decorrelating experience for 0 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,780][63769] Decorrelating experience for 0 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,781][63767] Decorrelating experience for 0 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,782][63805] Using port 40901 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,782][63769] Using port 40601 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,783][63767] Using port 40501 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,794][63771] Initialized w:5 v:0 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,796][63771] Decorrelating experience for 0 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,797][63771] Using port 40801 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,840][63735] Initialized w:0 v:0 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,842][63735] Decorrelating experience for 0 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,843][63735] Using port 40301 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,845][63734] Initialized w:1 v:0 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,847][63734] Decorrelating experience for 0 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,848][63734] Using port 40401 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,852][63770] Initialized w:4 v:0 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,854][63770] Decorrelating experience for 0 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:36,855][63770] Using port 40701 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,065][63767] Initialized w:2 v:1 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,065][63769] Initialized w:3 v:1 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,066][63767] Decorrelating experience for 32 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,067][63769] Decorrelating experience for 32 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,069][63805] Initialized w:6 v:1 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,070][63805] Decorrelating experience for 32 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,094][63771] Initialized w:5 v:1 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,095][63771] Decorrelating experience for 32 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,095][63806] Initialized w:7 v:1 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,097][63806] Decorrelating experience for 32 frames...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,151][63767] Port 40502 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,151][63767] Using port 40502\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,162][63805] Port 40902 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,162][63805] Using port 40902\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,176][63769] Port 40602 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,176][63769] Using port 40602\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,181][63767] Port 40503 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,181][63767] Using port 40503\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,183][63767] Using port 40502 on host...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,183][63771] Port 40802 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,183][63771] Using port 40802\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,190][63805] Port 40903 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,191][63805] Using port 40903\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,192][63805] Using port 40902 on host...\u001b[0m\n", + "\u001b[33m[2023-09-14 14:36:37,201][63806] UDP port 41002 cannot be used [Errno 98] Address already in use\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,201][63806] Port 42002 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,201][63806] Using port 42002\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,212][63771] Port 40803 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,213][63771] Using port 40803\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,214][63771] Using port 40802 on host...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,221][63769] Port 40603 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,221][63769] Using port 40603\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,224][63769] Using port 40602 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,239][63735] Initialized w:0 v:1 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,241][63735] Decorrelating experience for 32 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,246][63734] Initialized w:1 v:1 player:0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,247][63806] Port 41003 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,247][63806] Using port 41003\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,246][63770] Initialized w:4 v:1 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,247][63734] Decorrelating experience for 32 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,249][63806] Using port 42002 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,249][63770] Decorrelating experience for 32 frames...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,331][63735] Port 40302 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,331][63735] Using port 40302\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,343][63770] Port 40702 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,344][63770] Using port 40702\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,356][63734] Port 40402 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,357][63734] Using port 40402\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,360][63735] Port 40303 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,360][63735] Using port 40303\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,362][63735] Using port 40302 on host...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,376][63770] Port 40703 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,376][63770] Using port 40703\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,378][63770] Using port 40702 on host...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,402][63734] Port 40403 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,402][63734] Using port 40403\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,404][63734] Using port 40402 on host...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:37,459][109198] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 0. Throughput: 0: nan, 1: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,479][63805] Initialized w:6 v:2 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,480][63805] Decorrelating experience for 64 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,525][63767] Initialized w:2 v:2 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,526][63767] Decorrelating experience for 64 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,559][63769] Initialized w:3 v:2 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,561][63769] Decorrelating experience for 64 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,594][63805] Using port 40903 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,625][63767] Using port 40503 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,669][63806] Initialized w:7 v:2 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,670][63806] Decorrelating experience for 64 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,687][63769] Using port 40603 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,692][63771] Initialized w:5 v:2 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,694][63771] Decorrelating experience for 64 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,732][63735] Initialized w:0 v:2 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,733][63735] Decorrelating experience for 64 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,784][63806] Using port 41003 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,804][63771] Using port 40803 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,828][63770] Initialized w:4 v:2 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,830][63770] Decorrelating experience for 64 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,844][63735] Using port 40303 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,862][63734] Initialized w:1 v:2 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,865][63734] Decorrelating experience for 64 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,895][63805] Initialized w:6 v:3 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,897][63805] Decorrelating experience for 96 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,899][63767] Initialized w:2 v:3 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,900][63767] Decorrelating experience for 96 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,934][63770] Using port 40703 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,974][63769] Initialized w:3 v:3 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,976][63769] Decorrelating experience for 96 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:37,994][63734] Using port 40403 on host...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:38,077][63806] Initialized w:7 v:3 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:38,079][63806] Decorrelating experience for 96 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:38,101][63771] Initialized w:5 v:3 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:38,103][63771] Decorrelating experience for 96 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:38,132][63735] Initialized w:0 v:3 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:38,134][63735] Decorrelating experience for 96 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:38,269][63770] Initialized w:4 v:3 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:38,271][63770] Decorrelating experience for 96 frames...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:38,386][63734] Initialized w:1 v:3 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:38,387][63734] Decorrelating experience for 96 frames...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:39,962][63454] Signal inference workers to stop experience collection...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:39,965][63733] InferenceWorker_p1-w0: stopping experience collection\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:39,969][63732] InferenceWorker_p0-w0: stopping experience collection\u001b[0m\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/torch/nn/modules/module.py:1501: UserWarning: operator() profile_node %43 : int[] = prim::profile_ivalue(%axis.1)\n", + " does not have profile information (Triggered internally at ../third_party/nvfuser/csrc/graph_fuser.cpp:104.)\n", + " return forward_call(*args, **kwargs)\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/torch/nn/modules/module.py:1501: UserWarning: operator() profile_node %43 : int[] = prim::profile_ivalue(%axis.1)\n", + " does not have profile information (Triggered internally at ../third_party/nvfuser/csrc/graph_fuser.cpp:104.)\n", + " return forward_call(*args, **kwargs)\n", + "\u001b[36m[2023-09-14 14:36:42,458][109198] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 502.6, 1: 300.2. Samples: 4014. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:42,857][63454] Signal inference workers to resume experience collection...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:42,858][63732] InferenceWorker_p0-w0: resuming experience collection\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:42,858][63733] InferenceWorker_p1-w0: resuming experience collection\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:45,350][63576] Signal inference workers to stop experience collection...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:45,687][63576] Signal inference workers to resume experience collection...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:47,458][109198] Fps is (10 sec: 4505.7, 60 sec: 4505.7, 300 sec: 4505.7). Total num frames: 45056. Throughput: 0: 469.3, 1: 333.2. Samples: 8025. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:48,781][63732] Updated weights for policy 0, policy_version 10 (0.0700)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:49,727][109198] Heartbeat connected on Batcher_0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:49,730][109198] Heartbeat connected on LearnerWorker_p0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:49,734][109198] Heartbeat connected on Batcher_1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:49,737][109198] Heartbeat connected on LearnerWorker_p1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:49,748][109198] Heartbeat connected on InferenceWorker_p0-w0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:49,751][109198] Heartbeat connected on RolloutWorker_w0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:49,753][109198] Heartbeat connected on InferenceWorker_p1-w0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:49,756][109198] Heartbeat connected on RolloutWorker_w1\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:49,757][109198] Heartbeat connected on RolloutWorker_w2\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:49,761][109198] Heartbeat connected on RolloutWorker_w3\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:49,767][109198] Heartbeat connected on RolloutWorker_w4\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:49,769][109198] Heartbeat connected on RolloutWorker_w5\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:49,777][109198] Heartbeat connected on RolloutWorker_w6\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:49,779][109198] Heartbeat connected on RolloutWorker_w7\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:52,458][109198] Fps is (10 sec: 10240.1, 60 sec: 6826.8, 300 sec: 6826.8). Total num frames: 102400. Throughput: 0: 972.9, 1: 619.8. Samples: 23890. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:52,631][63733] Updated weights for policy 1, policy_version 10 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:36:54,671][63732] Updated weights for policy 0, policy_version 20 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:36:57,458][109198] Fps is (10 sec: 11468.8, 60 sec: 7987.3, 300 sec: 7987.3). Total num frames: 159744. Throughput: 0: 1250.4, 1: 781.0. Samples: 40627. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:00,489][63732] Updated weights for policy 0, policy_version 30 (0.0013)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:02,288][63733] Updated weights for policy 1, policy_version 20 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:02,458][109198] Fps is (10 sec: 11468.6, 60 sec: 8683.6, 300 sec: 8683.6). Total num frames: 217088. Throughput: 0: 1209.5, 1: 750.4. Samples: 48998. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:03,460][63734] DAMAGECOUNT value on done: 10.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:03,598][63734] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:03,754][63770] DAMAGECOUNT value on done: 15.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:03,755][63770] Sum rewards: -8.078, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.156', 'AMMO5': '0.005', 'AMMO2': '0.011', 'weapon4': '0.014', 'HITCOUNT': '0.020', 'weapon5': '0.026', 'DAMAGECOUNT': '0.045', 'ARMOR': '0.048', 'AMMO4': '0.054', 'AMMO3': '0.096', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.500', 'weapon3': '0.534', 'FRAGCOUNT': '1.000', 'weapon2': '1.026'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:03,781][63734] DAMAGECOUNT value on done: 46.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:04,094][63770] DAMAGECOUNT value on done: 20.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:04,095][63770] Sum rewards: -5.467, reward structure: {'DEATHCOUNT': '-6.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.318', 'AMMO5': '0.003', 'AMMO2': '0.003', 'AMMO4': '0.015', 'HITCOUNT': '0.020', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'DAMAGECOUNT': '0.060', 'AMMO3': '0.067', 'WEAPON5': '0.100', 'weapon5': '0.106', 'ARMOR': '0.116', 'weapon4': '0.124', 'WEAPON3': '0.350', 'weapon3': '0.498', 'weapon2': '0.818'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:04,866][63805] DAMAGECOUNT value on done: 35.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:05,004][63805] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:05,121][63806] DAMAGECOUNT value on done: 25.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:05,140][63735] DAMAGECOUNT value on done: 15.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:05,256][63806] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:05,257][63805] DAMAGECOUNT value on done: 15.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:05,281][63735] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:05,424][63771] DAMAGECOUNT value on done: 35.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:05,425][63771] Sum rewards: -5.664, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.012', 'AMMO2': '0.000', 'AMMO4': '0.000', 'HITCOUNT': '0.040', 'DAMAGECOUNT': '0.105', 'AMMO3': '0.106', 'WEAPON3': '0.450', 'weapon2': '0.812', 'weapon3': '0.834', 'FRAGCOUNT': '1.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:05,523][63806] DAMAGECOUNT value on done: 218.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:05,523][63806] Sum rewards: -4.069, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.198', 'AMMO2': '0.002', 'AMMO5': '0.003', 'AMMO4': '0.011', 'weapon5': '0.038', 'WEAPON5': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.133', 'DAMAGECOUNT': '0.654', 'WEAPON3': '0.700', 'weapon2': '0.784', 'weapon3': '0.944', 'FRAGCOUNT': '1.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:05,574][63771] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:05,589][63735] DAMAGECOUNT value on done: 15.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:05,605][63805] DAMAGECOUNT value on done: 150.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:05,606][63805] Sum rewards: -3.372, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.595', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO4': '0.026', 'ARMOR': '0.028', 'weapon4': '0.074', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.103', 'HITCOUNT': '0.150', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.600', 'weapon3': '0.786', 'weapon2': '0.796', 'FRAGCOUNT': '1.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:05,837][63771] DAMAGECOUNT value on done: 5.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:06,006][63805] DAMAGECOUNT value on done: 40.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:06,039][63734] DAMAGECOUNT value on done: 15.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:06,355][63734] DAMAGECOUNT value on done: 7.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:06,377][63767] DAMAGECOUNT value on done: 85.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:06,500][63767] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:06,623][63732] Updated weights for policy 0, policy_version 40 (0.0014)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:06,703][63769] DAMAGECOUNT value on done: 173.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:06,744][63767] DAMAGECOUNT value on done: 65.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:06,745][63767] Sum rewards: -2.545, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.475', 'AMMO2': '0.006', 'AMMO4': '0.028', 'WEAPON4': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.107', 'ARMOR': '0.116', 'weapon4': '0.168', 'DAMAGECOUNT': '0.195', 'WEAPON3': '0.500', 'weapon3': '0.786', 'weapon2': '0.914', 'FRAGCOUNT': '1.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:06,887][63806] DAMAGECOUNT value on done: 175.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:06,888][63806] Sum rewards: -7.130, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.074', 'AMMO5': '0.003', 'AMMO2': '0.005', 'weapon5': '0.010', 'AMMO4': '0.023', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'weapon4': '0.064', 'HITCOUNT': '0.110', 'AMMO3': '0.186', 'DAMAGECOUNT': '0.525', 'weapon2': '0.600', 'weapon3': '0.628', 'WEAPON3': '0.900', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:07,035][63769] DAMAGECOUNT value on done: 25.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:07,105][63767] DAMAGECOUNT value on done: 10.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:07,134][63735] DAMAGECOUNT value on done: 50.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:07,135][63735] Sum rewards: -6.700, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.710', 'AMMO4': '-0.013', 'AMMO2': '-0.003', 'HITCOUNT': '0.050', 'ARMOR': '0.060', 'DAMAGECOUNT': '0.150', 'AMMO3': '0.167', 'weapon3': '0.678', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.070'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:07,331][63806] DAMAGECOUNT value on done: 17.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:07,332][63806] Sum rewards: -9.517, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.022', 'AMMO2': '0.003', 'WEAPON1': '0.010', 'AMMO4': '0.016', 'HITCOUNT': '0.020', 'ARMOR': '0.028', 'WEAPON4': '0.050', 'DAMAGECOUNT': '0.051', 'weapon4': '0.066', 'AMMO3': '0.194', 'weapon3': '0.362', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.054'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:07,378][63771] DAMAGECOUNT value on done: 10.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:07,379][63771] Sum rewards: -5.850, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '0.002', 'AMMO5': '0.003', 'HITCOUNT': '0.010', 'AMMO2': '0.019', 'weapon5': '0.020', 'DAMAGECOUNT': '0.030', 'ARMOR': '0.041', 'WEAPON5': '0.050', 'AMMO3': '0.081', 'AMMO4': '0.096', 'WEAPON4': '0.150', 'weapon4': '0.178', 'WEAPON3': '0.450', 'weapon3': '0.496', 'weapon2': '0.774'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:07,457][63735] DAMAGECOUNT value on done: 0.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:07,458][109198] Fps is (10 sec: 11059.2, 60 sec: 9011.3, 300 sec: 9011.3). Total num frames: 270336. Throughput: 0: 1347.0, 1: 846.7. Samples: 65812. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:07,460][109198] Avg episode reward: [(0, '-6.331'), (1, '-6.765')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:07,463][63769] DAMAGECOUNT value on done: 130.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:07,464][63454] Saving new best policy, reward=-6.331!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:07,464][63576] Saving new best policy, reward=-6.765!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:07,546][63767] DAMAGECOUNT value on done: 0.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:07,625][63770] DAMAGECOUNT value on done: 55.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:07,625][63770] Sum rewards: -7.588, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.196', 'AMMO2': '0.016', 'WEAPON1': '0.020', 'weapon4': '0.026', 'ARMOR': '0.032', 'HITCOUNT': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.077', 'AMMO3': '0.146', 'DAMAGECOUNT': '0.165', 'weapon3': '0.742', 'WEAPON3': '0.800', 'weapon2': '0.984', 'FRAGCOUNT': '1.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:07,779][63771] DAMAGECOUNT value on done: 30.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:07,779][63771] Sum rewards: -5.993, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.352', 'AMMO4': '-0.008', 'AMMO2': '-0.002', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'HITCOUNT': '0.030', 'ARMOR': '0.036', 'DAMAGECOUNT': '0.090', 'AMMO3': '0.115', 'WEAPON3': '0.600', 'weapon3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.032'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:07,802][63770] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:07,938][63769] DAMAGECOUNT value on done: 55.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:08,049][63770] DAMAGECOUNT value on done: 90.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:08,049][63770] Sum rewards: -6.528, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.858', 'weapon5': '0.006', 'AMMO5': '0.007', 'AMMO2': '0.021', 'HITCOUNT': '0.080', 'weapon4': '0.100', 'AMMO4': '0.105', 'AMMO3': '0.132', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.270', 'weapon3': '0.418', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.040'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:08,085][63769] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:09,533][63733] Updated weights for policy 1, policy_version 30 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:12,458][109198] Fps is (10 sec: 11468.9, 60 sec: 9479.4, 300 sec: 9479.4). Total num frames: 331776. Throughput: 0: 1335.5, 1: 1024.1. Samples: 82588. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:12,460][109198] Avg episode reward: [(0, '-6.452'), (1, '-6.820')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:15,361][63733] Updated weights for policy 1, policy_version 40 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:16,143][63732] Updated weights for policy 0, policy_version 50 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:17,458][109198] Fps is (10 sec: 11468.7, 60 sec: 9625.6, 300 sec: 9625.6). Total num frames: 385024. Throughput: 0: 1250.5, 1: 1029.6. Samples: 91202. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:17,460][109198] Avg episode reward: [(0, '-6.452'), (1, '-6.820')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:19,253][63805] Large shaping reward -2.549 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.3, -100.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:21,156][63733] Updated weights for policy 1, policy_version 50 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:22,458][109198] Fps is (10 sec: 11059.2, 60 sec: 9830.5, 300 sec: 9830.5). Total num frames: 442368. Throughput: 0: 1254.8, 1: 1150.7. Samples: 108247. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:22,460][109198] Avg episode reward: [(0, '-6.452'), (1, '-6.820')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:25,759][63732] Updated weights for policy 0, policy_version 60 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:26,940][63733] Updated weights for policy 1, policy_version 60 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:27,460][109198] Fps is (10 sec: 11057.5, 60 sec: 9912.1, 300 sec: 9912.1). Total num frames: 495616. Throughput: 0: 1339.5, 1: 1353.3. Samples: 125197. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:27,461][109198] Avg episode reward: [(0, '-6.452'), (1, '-6.820')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:27,670][63770] DAMAGECOUNT value on done: 20.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:27,671][63770] Sum rewards: -11.475, reward structure: {'DEATHCOUNT': '-11.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.470', 'AMMO5': '0.003', 'weapon5': '0.006', 'HITCOUNT': '0.010', 'AMMO2': '0.011', 'DAMAGECOUNT': '0.015', 'WEAPON1': '0.020', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.053', 'AMMO3': '0.113', 'weapon4': '0.148', 'weapon3': '0.404', 'WEAPON3': '0.550', 'weapon2': '1.312'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:27,794][63806] DAMAGECOUNT value on done: 25.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:27,795][63806] Sum rewards: -10.169, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.638', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.003', 'AMMO2': '0.015', 'weapon5': '0.016', 'weapon4': '0.034', 'ARMOR': '0.048', 'WEAPON5': '0.050', 'AMMO4': '0.075', 'WEAPON4': '0.100', 'AMMO3': '0.134', 'weapon3': '0.492', 'WEAPON3': '0.700', 'weapon2': '1.052'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:28,074][63770] DAMAGECOUNT value on done: 20.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:28,194][63806] DAMAGECOUNT value on done: 343.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:28,195][63806] Sum rewards: -6.892, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.150', 'AMMO5': '0.007', 'AMMO2': '0.012', 'weapon4': '0.012', 'ARMOR': '0.016', 'WEAPON1': '0.020', 'AMMO4': '0.059', 'HITCOUNT': '0.070', 'AMMO3': '0.099', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.550', 'weapon3': '0.660', 'FRAGCOUNT': '1.000', 'weapon2': '1.128'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:28,618][63805] DAMAGECOUNT value on done: 50.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:28,665][63734] DAMAGECOUNT value on done: 295.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:28,792][63734] DAMAGECOUNT value on done: 20.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:29,002][63805] DAMAGECOUNT value on done: 15.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:29,052][63734] DAMAGECOUNT value on done: 56.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:29,111][63735] DAMAGECOUNT value on done: 80.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:29,144][63734] DAMAGECOUNT value on done: 57.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:29,317][63771] DAMAGECOUNT value on done: 185.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:29,318][63771] Sum rewards: -6.046, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.970', 'AMMO5': '0.005', 'AMMO2': '0.005', 'weapon5': '0.006', 'weapon4': '0.014', 'AMMO4': '0.025', 'ARMOR': '0.055', 'HITCOUNT': '0.090', 'AMMO3': '0.095', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.500', 'weapon3': '0.582', 'FRAGCOUNT': '1.000', 'weapon2': '1.146'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:29,576][63735] DAMAGECOUNT value on done: 30.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:29,669][63806] DAMAGECOUNT value on done: 190.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:29,752][63735] DAMAGECOUNT value on done: 132.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:29,752][63735] Sum rewards: -7.148, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.382', 'AMMO2': '0.003', 'AMMO4': '0.016', 'weapon4': '0.038', 'WEAPON4': '0.050', 'HITCOUNT': '0.080', 'AMMO3': '0.154', 'DAMAGECOUNT': '0.351', 'ARMOR': '0.476', 'weapon3': '0.502', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.264'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:29,763][63771] DAMAGECOUNT value on done: 5.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:30,085][63806] DAMAGECOUNT value on done: 42.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:30,101][63735] DAMAGECOUNT value on done: 35.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:30,101][63767] DAMAGECOUNT value on done: 173.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:30,101][63735] Sum rewards: -8.929, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.084', 'AMMO5': '0.007', 'HITCOUNT': '0.010', 'AMMO2': '0.017', 'WEAPON1': '0.020', 'weapon5': '0.042', 'DAMAGECOUNT': '0.060', 'AMMO4': '0.083', 'AMMO3': '0.094', 'ARMOR': '0.104', 'weapon4': '0.144', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'weapon3': '0.376', 'WEAPON3': '0.500', 'weapon2': '0.898'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:30,180][63771] DAMAGECOUNT value on done: 10.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:30,416][63767] DAMAGECOUNT value on done: 180.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:30,417][63767] Sum rewards: -5.813, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.600', 'weapon5': '0.002', 'AMMO2': '0.007', 'ARMOR': '0.012', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.037', 'HITCOUNT': '0.060', 'AMMO3': '0.172', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.345', 'weapon3': '0.714', 'WEAPON3': '0.900', 'weapon2': '1.052', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:30,634][63771] DAMAGECOUNT value on done: 190.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:30,634][63771] Sum rewards: -10.164, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.192', 'ARMOR': '0.020', 'AMMO2': '0.022', 'WEAPON4': '0.100', 'AMMO4': '0.109', 'HITCOUNT': '0.120', 'AMMO3': '0.209', 'DAMAGECOUNT': '0.480', 'weapon3': '0.698', 'weapon2': '0.970', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:30,730][63805] DAMAGECOUNT value on done: 240.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:30,731][63805] Sum rewards: -9.086, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.516', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.010', 'weapon5': '0.020', 'AMMO2': '0.023', 'weapon4': '0.032', 'ARMOR': '0.040', 'HITCOUNT': '0.090', 'AMMO4': '0.117', 'AMMO3': '0.130', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.270', 'WEAPON3': '0.700', 'weapon3': '0.714', 'weapon2': '1.184'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:31,059][63805] DAMAGECOUNT value on done: 335.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:31,060][63805] Sum rewards: -4.074, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.136', 'ARMOR': '0.004', 'AMMO2': '0.016', 'weapon4': '0.032', 'AMMO4': '0.078', 'HITCOUNT': '0.110', 'AMMO3': '0.139', 'WEAPON4': '0.150', 'weapon3': '0.626', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.885', 'weapon2': '1.272', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:31,574][63769] DAMAGECOUNT value on done: 135.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:31,989][63769] DAMAGECOUNT value on done: 65.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:32,122][63767] DAMAGECOUNT value on done: 70.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:32,138][63769] DAMAGECOUNT value on done: 254.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:32,139][63769] Sum rewards: -2.667, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO2': '0.018', 'ARMOR': '0.032', 'HITCOUNT': '0.070', 'AMMO4': '0.087', 'WEAPON4': '0.100', 'weapon4': '0.122', 'AMMO3': '0.125', 'DAMAGECOUNT': '0.243', 'HEALTH': '0.300', 'WEAPON3': '0.650', 'weapon3': '0.890', 'weapon2': '0.946', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:32,459][109198] Fps is (10 sec: 11058.9, 60 sec: 10053.8, 300 sec: 10053.8). Total num frames: 552960. Throughput: 0: 1362.9, 1: 1417.8. Samples: 133158. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:32,461][109198] Avg episode reward: [(0, '-6.969'), (1, '-7.181')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:32,486][63767] DAMAGECOUNT value on done: 66.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:32,571][63769] DAMAGECOUNT value on done: 54.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:32,865][63770] DAMAGECOUNT value on done: 70.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:33,086][63733] Updated weights for policy 1, policy_version 70 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:33,254][63770] DAMAGECOUNT value on done: 140.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:33,255][63770] Sum rewards: -7.999, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.638', 'AMMO2': '0.020', 'HITCOUNT': '0.050', 'weapon4': '0.062', 'AMMO4': '0.099', 'WEAPON4': '0.100', 'AMMO3': '0.106', 'DAMAGECOUNT': '0.150', 'weapon3': '0.404', 'WEAPON3': '0.450', 'ARMOR': '0.488', 'FRAGCOUNT': '1.000', 'weapon2': '1.210'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:34,909][63732] Updated weights for policy 0, policy_version 70 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:37,458][109198] Fps is (10 sec: 11061.0, 60 sec: 10103.5, 300 sec: 10103.5). Total num frames: 606208. Throughput: 0: 1290.4, 1: 1501.8. Samples: 149539. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:37,460][109198] Avg episode reward: [(0, '-6.882'), (1, '-7.197')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:39,339][63733] Updated weights for policy 1, policy_version 80 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:42,458][109198] Fps is (10 sec: 11059.5, 60 sec: 11059.2, 300 sec: 10208.5). Total num frames: 663552. Throughput: 0: 1206.2, 1: 1576.1. Samples: 165833. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:42,460][109198] Avg episode reward: [(0, '-6.882'), (1, '-7.197')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:44,104][63732] Updated weights for policy 0, policy_version 80 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:45,714][63733] Updated weights for policy 1, policy_version 90 (0.0013)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:47,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11195.7, 300 sec: 10240.0). Total num frames: 716800. Throughput: 0: 1163.5, 1: 1615.8. Samples: 174069. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:47,460][109198] Avg episode reward: [(0, '-6.882'), (1, '-7.197')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:51,961][63733] Updated weights for policy 1, policy_version 100 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:52,135][63771] DAMAGECOUNT value on done: 220.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:52,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11195.7, 300 sec: 10322.0). Total num frames: 774144. Throughput: 0: 1088.3, 1: 1685.2. Samples: 190619. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:52,460][109198] Avg episode reward: [(0, '-6.891'), (1, '-7.197')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:52,475][63734] DAMAGECOUNT value on done: 335.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:52,499][63805] DAMAGECOUNT value on done: 60.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:52,525][63771] DAMAGECOUNT value on done: 42.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:52,885][63734] DAMAGECOUNT value on done: 106.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:52,912][63805] DAMAGECOUNT value on done: 85.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:53,247][63806] DAMAGECOUNT value on done: 106.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:53,366][63732] Updated weights for policy 0, policy_version 90 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:53,471][63770] DAMAGECOUNT value on done: 35.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:53,546][63767] DAMAGECOUNT value on done: 260.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:53,630][63806] DAMAGECOUNT value on done: 373.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:53,714][63771] DAMAGECOUNT value on done: 18.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:53,828][63770] DAMAGECOUNT value on done: 155.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:53,828][63770] Sum rewards: -7.221, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.253', 'AMMO5': '0.003', 'weapon5': '0.004', 'AMMO2': '0.024', 'WEAPON5': '0.050', 'ARMOR': '0.076', 'HITCOUNT': '0.080', 'weapon4': '0.106', 'AMMO4': '0.117', 'AMMO3': '0.153', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.405', 'weapon3': '0.558', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.156'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:53,957][63767] DAMAGECOUNT value on done: 225.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:53,957][63767] Sum rewards: -1.925, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.155', 'AMMO5': '0.007', 'AMMO2': '0.020', 'weapon5': '0.028', 'HITCOUNT': '0.050', 'WEAPON5': '0.050', 'weapon4': '0.070', 'ARMOR': '0.085', 'AMMO4': '0.097', 'AMMO3': '0.121', 'DAMAGECOUNT': '0.135', 'WEAPON4': '0.200', 'weapon3': '0.546', 'WEAPON3': '0.650', 'weapon2': '1.170', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:54,094][63771] DAMAGECOUNT value on done: 217.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:54,286][63734] DAMAGECOUNT value on done: 35.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:54,761][63735] DAMAGECOUNT value on done: 100.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:54,773][63734] DAMAGECOUNT value on done: 162.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:54,774][63734] Sum rewards: -6.917, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.010', 'AMMO2': '0.020', 'ARMOR': '0.024', 'WEAPON1': '0.030', 'weapon4': '0.032', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'AMMO4': '0.102', 'AMMO3': '0.124', 'DAMAGECOUNT': '0.315', 'weapon3': '0.606', 'WEAPON3': '0.650', 'weapon2': '1.240', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:54,820][63767] DAMAGECOUNT value on done: 155.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:54,821][63767] Sum rewards: -5.440, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.668', 'AMMO4': '-0.018', 'AMMO2': '-0.004', 'ARMOR': '0.052', 'HITCOUNT': '0.060', 'AMMO3': '0.135', 'DAMAGECOUNT': '0.255', 'WEAPON3': '0.550', 'weapon3': '0.706', 'weapon2': '0.992', 'FRAGCOUNT': '1.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:55,127][63735] DAMAGECOUNT value on done: 107.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:55,128][63735] Sum rewards: -6.089, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.822', 'AMMO2': '0.013', 'HITCOUNT': '0.060', 'AMMO4': '0.062', 'WEAPON4': '0.100', 'AMMO3': '0.107', 'weapon4': '0.124', 'DAMAGECOUNT': '0.231', 'weapon3': '0.398', 'WEAPON3': '0.450', 'FRAGCOUNT': '1.000', 'weapon2': '1.188'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:55,178][63806] DAMAGECOUNT value on done: 270.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:55,214][63767] DAMAGECOUNT value on done: 71.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:55,246][63735] DAMAGECOUNT value on done: 132.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:55,535][63806] DAMAGECOUNT value on done: 56.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:55,628][63735] DAMAGECOUNT value on done: 200.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:55,628][63735] Sum rewards: -6.599, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.222', 'AMMO2': '0.001', 'AMMO5': '0.003', 'AMMO4': '0.006', 'WEAPON5': '0.050', 'ARMOR': '0.080', 'HITCOUNT': '0.080', 'AMMO3': '0.182', 'DAMAGECOUNT': '0.495', 'weapon3': '0.872', 'WEAPON3': '0.950', 'weapon2': '1.154', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:56,178][63769] DAMAGECOUNT value on done: 339.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:56,339][63805] DAMAGECOUNT value on done: 265.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:56,340][63805] Sum rewards: -8.041, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.003', 'AMMO2': '0.014', 'HITCOUNT': '0.020', 'weapon5': '0.032', 'WEAPON5': '0.050', 'AMMO4': '0.072', 'DAMAGECOUNT': '0.075', 'ARMOR': '0.088', 'weapon4': '0.090', 'AMMO3': '0.128', 'WEAPON4': '0.150', 'weapon3': '0.370', 'HEALTH': '0.463', 'WEAPON3': '0.600', 'weapon2': '1.054'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:56,589][63769] DAMAGECOUNT value on done: 89.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:56,654][63805] DAMAGECOUNT value on done: 340.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:57,376][63769] DAMAGECOUNT value on done: 269.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:57,422][63771] Large shaping reward -2.549 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.3, -100.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:57,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11127.5, 300 sec: 10342.4). Total num frames: 827392. Throughput: 0: 1106.0, 1: 1648.4. Samples: 206533. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:37:57,460][109198] Avg episode reward: [(0, '-6.674'), (1, '-6.883')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:57,762][63769] DAMAGECOUNT value on done: 90.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:58,745][63770] DAMAGECOUNT value on done: 115.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:58,997][63733] Updated weights for policy 1, policy_version 110 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:59,116][63770] DAMAGECOUNT value on done: 245.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:37:59,116][63770] Sum rewards: -6.528, reward structure: {'DEATHCOUNT': '-10.500', 'AMMO5': '0.003', 'AMMO2': '0.015', 'weapon5': '0.024', 'HEALTH': '0.042', 'WEAPON5': '0.050', 'weapon4': '0.054', 'HITCOUNT': '0.060', 'AMMO4': '0.073', 'ARMOR': '0.076', 'WEAPON4': '0.100', 'AMMO3': '0.107', 'DAMAGECOUNT': '0.315', 'weapon3': '0.402', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon2': '1.152'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:00,800][63732] Updated weights for policy 0, policy_version 100 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:02,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11127.5, 300 sec: 10408.7). Total num frames: 884736. Throughput: 0: 1128.8, 1: 1620.4. Samples: 214914. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:02,459][109198] Avg episode reward: [(0, '-6.604'), (1, '-6.799')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:06,215][63733] Updated weights for policy 1, policy_version 120 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:07,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11195.7, 300 sec: 10467.6). Total num frames: 942080. Throughput: 0: 1175.3, 1: 1576.3. Samples: 232069. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:07,460][109198] Avg episode reward: [(0, '-6.604'), (1, '-6.799')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:08,040][63732] Updated weights for policy 0, policy_version 110 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:12,458][109198] Fps is (10 sec: 11468.6, 60 sec: 11127.4, 300 sec: 10520.3). Total num frames: 999424. Throughput: 0: 1221.7, 1: 1526.4. Samples: 248854. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:12,460][109198] Avg episode reward: [(0, '-6.604'), (1, '-6.799')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:13,497][63733] Updated weights for policy 1, policy_version 130 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:15,314][63732] Updated weights for policy 0, policy_version 120 (0.0013)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:15,812][63734] DAMAGECOUNT value on done: 425.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:16,035][63805] DAMAGECOUNT value on done: 150.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:16,036][63805] Sum rewards: -6.780, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.430', 'ARMOR': '0.004', 'AMMO2': '0.020', 'HITCOUNT': '0.070', 'AMMO4': '0.101', 'AMMO3': '0.134', 'WEAPON4': '0.150', 'weapon4': '0.152', 'DAMAGECOUNT': '0.270', 'weapon3': '0.672', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.126'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:16,195][63734] DAMAGECOUNT value on done: 116.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:16,421][63805] DAMAGECOUNT value on done: 186.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:16,865][63735] DAMAGECOUNT value on done: 125.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:17,203][63771] DAMAGECOUNT value on done: 53.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:17,204][63771] Sum rewards: -6.894, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.376', 'AMMO5': '0.005', 'ARMOR': '0.008', 'AMMO2': '0.009', 'HITCOUNT': '0.030', 'AMMO4': '0.044', 'weapon5': '0.054', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.105', 'AMMO3': '0.143', 'WEAPON3': '0.750', 'weapon3': '0.794', 'FRAGCOUNT': '1.000', 'weapon2': '1.090'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:17,254][63735] DAMAGECOUNT value on done: 156.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:17,365][63735] DAMAGECOUNT value on done: 202.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:17,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11127.5, 300 sec: 10526.7). Total num frames: 1052672. Throughput: 0: 1244.1, 1: 1516.9. Samples: 257400. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:17,460][109198] Avg episode reward: [(0, '-6.590'), (1, '-6.868')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:17,541][63771] DAMAGECOUNT value on done: 217.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:17,572][63734] DAMAGECOUNT value on done: 65.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:17,711][63771] DAMAGECOUNT value on done: 399.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:17,712][63771] Sum rewards: -2.728, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.346', 'weapon5': '0.002', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'AMMO4': '0.053', 'AMMO3': '0.066', 'WEAPON4': '0.100', 'HITCOUNT': '0.150', 'weapon4': '0.172', 'WEAPON3': '0.350', 'DAMAGECOUNT': '0.537', 'weapon3': '0.726', 'FRAGCOUNT': '1.000', 'weapon2': '1.096'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:17,736][63735] DAMAGECOUNT value on done: 250.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:17,737][63735] Sum rewards: -7.699, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.351', 'AMMO2': '0.003', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO4': '0.014', 'HITCOUNT': '0.050', 'weapon5': '0.054', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.150', 'AMMO3': '0.161', 'WEAPON3': '0.750', 'weapon3': '0.788', 'weapon2': '1.064'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:17,802][63806] DAMAGECOUNT value on done: 365.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:17,802][63806] Sum rewards: -5.291, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.145', 'AMMO2': '0.004', 'AMMO5': '0.005', 'AMMO4': '0.021', 'weapon4': '0.042', 'HITCOUNT': '0.050', 'AMMO3': '0.091', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.285', 'ARMOR': '0.445', 'WEAPON3': '0.450', 'weapon3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.060'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:17,899][63734] DAMAGECOUNT value on done: 177.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:17,899][63734] Sum rewards: -8.221, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.176', 'AMMO5': '0.003', 'weapon4': '0.006', 'HITCOUNT': '0.010', 'weapon5': '0.010', 'AMMO2': '0.015', 'DAMAGECOUNT': '0.045', 'WEAPON5': '0.050', 'AMMO4': '0.073', 'WEAPON4': '0.100', 'AMMO3': '0.121', 'ARMOR': '0.478', 'WEAPON3': '0.650', 'weapon3': '0.814', 'weapon2': '1.080'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:18,045][63771] DAMAGECOUNT value on done: 249.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:18,045][63771] Sum rewards: -4.517, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.964', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'AMMO2': '0.012', 'weapon5': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'AMMO4': '0.058', 'WEAPON5': '0.100', 'AMMO3': '0.106', 'weapon4': '0.122', 'HITCOUNT': '0.130', 'WEAPON4': '0.150', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.621', 'weapon3': '0.778', 'weapon2': '0.950'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:18,099][63806] DAMAGECOUNT value on done: 141.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:18,099][63806] Sum rewards: -7.399, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.285', 'AMMO2': '0.003', 'AMMO5': '0.005', 'weapon4': '0.008', 'AMMO4': '0.014', 'weapon5': '0.020', 'HITCOUNT': '0.030', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.105', 'AMMO3': '0.136', 'ARMOR': '0.443', 'WEAPON3': '0.600', 'weapon3': '0.822', 'FRAGCOUNT': '1.000', 'weapon2': '1.050'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:18,141][63806] DAMAGECOUNT value on done: 126.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:18,191][63767] DAMAGECOUNT value on done: 210.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:18,513][63767] DAMAGECOUNT value on done: 103.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:18,514][63767] Sum rewards: -11.440, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-3.000', 'HEALTH': '-1.920', 'AMMO5': '0.009', 'HITCOUNT': '0.030', 'AMMO2': '0.031', 'weapon5': '0.036', 'DAMAGECOUNT': '0.096', 'ARMOR': '0.100', 'AMMO3': '0.127', 'AMMO4': '0.153', 'weapon4': '0.188', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'weapon3': '0.280', 'WEAPON3': '0.550', 'weapon2': '1.180'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:18,538][63806] DAMAGECOUNT value on done: 408.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:18,952][63770] DAMAGECOUNT value on done: 91.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:19,018][63767] DAMAGECOUNT value on done: 260.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:19,308][63770] DAMAGECOUNT value on done: 175.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:19,345][63767] DAMAGECOUNT value on done: 254.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:19,345][63767] Sum rewards: -5.554, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.903', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.008', 'AMMO2': '0.013', 'HITCOUNT': '0.020', 'weapon5': '0.022', 'ARMOR': '0.040', 'AMMO3': '0.049', 'AMMO4': '0.066', 'weapon4': '0.076', 'DAMAGECOUNT': '0.087', 'WEAPON5': '0.100', 'weapon3': '0.182', 'WEAPON4': '0.200', 'WEAPON3': '0.250', 'weapon2': '1.486'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:19,459][63769] DAMAGECOUNT value on done: 379.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:19,459][63769] Sum rewards: -7.474, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.610', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.007', 'AMMO2': '0.028', 'weapon5': '0.032', 'ARMOR': '0.040', 'HITCOUNT': '0.040', 'AMMO3': '0.093', 'DAMAGECOUNT': '0.120', 'AMMO4': '0.141', 'WEAPON5': '0.150', 'weapon4': '0.174', 'WEAPON4': '0.350', 'weapon3': '0.386', 'WEAPON3': '0.500', 'weapon2': '1.074'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:19,833][63769] DAMAGECOUNT value on done: 109.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:20,212][63733] Updated weights for policy 1, policy_version 140 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:21,724][63805] DAMAGECOUNT value on done: 335.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:21,725][63805] Sum rewards: -6.938, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.762', 'AMMO2': '0.009', 'WEAPON1': '0.020', 'AMMO4': '0.043', 'WEAPON4': '0.050', 'ARMOR': '0.086', 'HITCOUNT': '0.110', 'AMMO3': '0.184', 'DAMAGECOUNT': '0.210', 'weapon3': '0.832', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.030'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:22,081][63805] DAMAGECOUNT value on done: 507.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:22,082][63805] Sum rewards: -7.504, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.364', 'AMMO5': '0.005', 'AMMO2': '0.015', 'weapon4': '0.058', 'AMMO4': '0.077', 'WEAPON5': '0.100', 'HITCOUNT': '0.140', 'WEAPON4': '0.150', 'AMMO3': '0.174', 'DAMAGECOUNT': '0.501', 'weapon3': '0.746', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.344'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:22,117][63770] DAMAGECOUNT value on done: 115.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:22,458][109198] Fps is (10 sec: 11469.0, 60 sec: 11195.7, 300 sec: 10610.6). Total num frames: 1114112. Throughput: 0: 1268.8, 1: 1507.8. Samples: 274486. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:22,460][109198] Avg episode reward: [(0, '-6.647'), (1, '-6.768')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:22,503][63770] DAMAGECOUNT value on done: 255.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:22,689][63769] DAMAGECOUNT value on done: 284.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:23,040][63769] DAMAGECOUNT value on done: 120.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:23,041][63769] Sum rewards: -7.067, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-0.500', 'HEALTH': '-0.203', 'AMMO5': '0.003', 'AMMO2': '0.017', 'HITCOUNT': '0.020', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'WEAPON5': '0.050', 'weapon5': '0.052', 'AMMO3': '0.065', 'AMMO4': '0.087', 'DAMAGECOUNT': '0.090', 'weapon4': '0.114', 'WEAPON4': '0.150', 'weapon3': '0.258', 'WEAPON3': '0.300', 'weapon2': '1.374'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:23,325][63732] Updated weights for policy 0, policy_version 130 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:26,236][63733] Updated weights for policy 1, policy_version 150 (0.0013)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:27,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11196.0, 300 sec: 10612.4). Total num frames: 1167360. Throughput: 0: 1273.4, 1: 1515.6. Samples: 291335. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:27,459][109198] Avg episode reward: [(0, '-6.667'), (1, '-6.755')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:27,465][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000134_548864.pth...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:27,465][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000151_618496.pth...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:27,527][63576] Saving new best policy, reward=-6.755!\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:32,458][109198] Fps is (10 sec: 10649.6, 60 sec: 11127.5, 300 sec: 10614.0). Total num frames: 1220608. Throughput: 0: 1271.8, 1: 1507.9. Samples: 299152. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:32,459][109198] Avg episode reward: [(0, '-6.667'), (1, '-6.755')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:32,523][63732] Updated weights for policy 0, policy_version 140 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:32,773][63733] Updated weights for policy 1, policy_version 160 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:37,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11195.7, 300 sec: 10649.6). Total num frames: 1277952. Throughput: 0: 1271.4, 1: 1510.8. Samples: 315816. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:37,460][109198] Avg episode reward: [(0, '-6.667'), (1, '-6.755')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:39,026][63733] Updated weights for policy 1, policy_version 170 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:39,836][63734] DAMAGECOUNT value on done: 560.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:39,837][63734] Sum rewards: -5.073, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.735', 'AMMO5': '0.005', 'AMMO2': '0.014', 'AMMO4': '0.071', 'weapon4': '0.096', 'HITCOUNT': '0.120', 'AMMO3': '0.129', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.750', 'weapon3': '0.872', 'weapon2': '1.300', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:39,985][63735] DAMAGECOUNT value on done: 140.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:40,127][63805] DAMAGECOUNT value on done: 250.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:40,190][63734] DAMAGECOUNT value on done: 156.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:40,266][63735] DAMAGECOUNT value on done: 170.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:40,497][63805] DAMAGECOUNT value on done: 211.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:40,787][63767] DAMAGECOUNT value on done: 278.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:41,136][63767] DAMAGECOUNT value on done: 337.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:41,136][63767] Sum rewards: -5.157, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.267', 'weapon4': '0.008', 'AMMO2': '0.010', 'AMMO4': '0.052', 'AMMO3': '0.076', 'ARMOR': '0.076', 'WEAPON4': '0.100', 'HITCOUNT': '0.180', 'WEAPON3': '0.400', 'weapon3': '0.680', 'DAMAGECOUNT': '0.702', 'weapon2': '1.326', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:41,408][63771] DAMAGECOUNT value on done: 183.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:41,408][63771] Sum rewards: -5.230, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.572', 'AMMO2': '0.015', 'weapon7': '0.060', 'AMMO4': '0.077', 'HITCOUNT': '0.090', 'AMMO3': '0.144', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'weapon4': '0.256', 'DAMAGECOUNT': '0.390', 'weapon3': '0.706', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.084'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:41,529][63732] Updated weights for policy 0, policy_version 150 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:41,745][63771] DAMAGECOUNT value on done: 222.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:42,349][63735] DAMAGECOUNT value on done: 327.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:42,350][63735] Sum rewards: -3.193, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.058', 'AMMO2': '0.021', 'ARMOR': '0.055', 'HITCOUNT': '0.080', 'AMMO3': '0.095', 'AMMO4': '0.107', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.550', 'weapon3': '0.994', 'FRAGCOUNT': '1.000', 'weapon2': '1.138'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:42,397][63767] DAMAGECOUNT value on done: 295.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:42,397][63767] Sum rewards: -8.105, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.283', 'AMMO5': '0.005', 'AMMO2': '0.013', 'HITCOUNT': '0.030', 'ARMOR': '0.036', 'weapon4': '0.042', 'AMMO4': '0.063', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.105', 'WEAPON4': '0.150', 'AMMO3': '0.160', 'WEAPON3': '0.900', 'weapon3': '0.976', 'FRAGCOUNT': '1.000', 'weapon2': '1.098'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:42,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11195.7, 300 sec: 10682.4). Total num frames: 1335296. Throughput: 0: 1263.9, 1: 1533.3. Samples: 332407. Policy #0 lag: (min: 0.0, avg: 0.3, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:42,460][109198] Avg episode reward: [(0, '-6.660'), (1, '-6.679')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:42,461][63576] Saving new best policy, reward=-6.679!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:42,741][63806] DAMAGECOUNT value on done: 365.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:42,748][63735] DAMAGECOUNT value on done: 268.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:42,759][63767] DAMAGECOUNT value on done: 263.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:42,927][63734] DAMAGECOUNT value on done: 135.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:43,030][63806] DAMAGECOUNT value on done: 241.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:43,031][63806] Sum rewards: -8.499, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.934', 'AMMO5': '0.005', 'weapon5': '0.010', 'AMMO2': '0.016', 'HITCOUNT': '0.060', 'ARMOR': '0.068', 'AMMO4': '0.078', 'WEAPON5': '0.100', 'weapon4': '0.170', 'AMMO3': '0.175', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.300', 'weapon3': '0.576', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.028'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:43,076][63806] DAMAGECOUNT value on done: 136.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:43,287][63769] DAMAGECOUNT value on done: 429.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:43,368][63734] DAMAGECOUNT value on done: 177.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:43,398][63771] DAMAGECOUNT value on done: 418.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:43,399][63771] Sum rewards: -8.294, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.411', 'AMMO2': '0.008', 'weapon4': '0.012', 'HITCOUNT': '0.030', 'ARMOR': '0.040', 'AMMO4': '0.041', 'DAMAGECOUNT': '0.057', 'WEAPON4': '0.100', 'AMMO3': '0.121', 'WEAPON3': '0.650', 'weapon3': '0.692', 'FRAGCOUNT': '1.000', 'weapon2': '1.116'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:43,483][63806] DAMAGECOUNT value on done: 428.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:43,620][63769] DAMAGECOUNT value on done: 174.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:43,741][63771] DAMAGECOUNT value on done: 313.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:43,741][63771] Sum rewards: -7.338, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.518', 'AMMO2': '0.008', 'AMMO4': '0.037', 'HITCOUNT': '0.060', 'ARMOR': '0.064', 'WEAPON4': '0.100', 'weapon4': '0.166', 'AMMO3': '0.185', 'DAMAGECOUNT': '0.192', 'weapon3': '0.712', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.206'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:44,404][63770] DAMAGECOUNT value on done: 91.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:44,812][63770] DAMAGECOUNT value on done: 226.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:44,813][63770] Sum rewards: -7.279, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.290', 'AMMO2': '0.009', 'ARMOR': '0.020', 'AMMO4': '0.045', 'weapon4': '0.048', 'HITCOUNT': '0.070', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.153', 'AMMO3': '0.174', 'weapon3': '0.708', 'WEAPON3': '0.950', 'weapon2': '1.234', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:45,134][63733] Updated weights for policy 1, policy_version 180 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:45,268][63770] DAMAGECOUNT value on done: 205.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:45,268][63770] Sum rewards: -5.193, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.750', 'AMMO2': '0.015', 'HITCOUNT': '0.060', 'ARMOR': '0.064', 'AMMO4': '0.074', 'AMMO3': '0.110', 'weapon4': '0.146', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.270', 'weapon3': '0.452', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.066'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:45,603][63770] DAMAGECOUNT value on done: 315.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:45,603][63770] Sum rewards: -6.227, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.982', 'AMMO2': '0.002', 'AMMO5': '0.009', 'AMMO4': '0.011', 'weapon5': '0.016', 'WEAPON4': '0.050', 'ARMOR': '0.056', 'HITCOUNT': '0.060', 'weapon4': '0.092', 'WEAPON5': '0.100', 'AMMO3': '0.110', 'DAMAGECOUNT': '0.180', 'WEAPON3': '0.550', 'weapon3': '0.796', 'weapon2': '0.972'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:46,294][63769] DAMAGECOUNT value on done: 389.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:46,294][63769] Sum rewards: -8.171, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.620', 'weapon5': '0.008', 'AMMO2': '0.011', 'AMMO5': '0.015', 'AMMO4': '0.054', 'weapon4': '0.056', 'HITCOUNT': '0.090', 'WEAPON4': '0.150', 'AMMO3': '0.160', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.900', 'weapon3': '0.914', 'FRAGCOUNT': '1.000', 'weapon2': '1.076'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:46,638][63769] DAMAGECOUNT value on done: 145.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:47,173][63805] DAMAGECOUNT value on done: 380.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:47,174][63805] Sum rewards: -6.813, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.328', 'AMMO5': '0.013', 'AMMO2': '0.017', 'weapon5': '0.026', 'HITCOUNT': '0.050', 'AMMO4': '0.086', 'AMMO3': '0.087', 'DAMAGECOUNT': '0.135', 'WEAPON4': '0.150', 'weapon4': '0.162', 'WEAPON5': '0.200', 'weapon3': '0.372', 'WEAPON3': '0.450', 'ARMOR': '0.525', 'FRAGCOUNT': '1.000', 'weapon2': '1.492'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:47,458][109198] Fps is (10 sec: 11059.0, 60 sec: 11195.7, 300 sec: 10681.1). Total num frames: 1388544. Throughput: 0: 1245.2, 1: 1554.9. Samples: 340918. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:47,460][109198] Avg episode reward: [(0, '-6.786'), (1, '-6.714')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:47,608][63805] DAMAGECOUNT value on done: 507.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:50,283][63732] Updated weights for policy 0, policy_version 160 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:51,268][63733] Updated weights for policy 1, policy_version 190 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:52,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11195.7, 300 sec: 10710.3). Total num frames: 1445888. Throughput: 0: 1210.6, 1: 1585.6. Samples: 357897. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:52,460][109198] Avg episode reward: [(0, '-6.786'), (1, '-6.730')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:57,304][63733] Updated weights for policy 1, policy_version 200 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:57,458][109198] Fps is (10 sec: 11878.5, 60 sec: 11332.3, 300 sec: 10766.6). Total num frames: 1507328. Throughput: 0: 1177.7, 1: 1625.3. Samples: 374989. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:38:57,460][109198] Avg episode reward: [(0, '-6.786'), (1, '-6.730')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:38:59,126][63732] Updated weights for policy 0, policy_version 170 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:01,953][63735] DAMAGECOUNT value on done: 305.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:01,954][63735] Sum rewards: -8.183, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.139', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.003', 'AMMO2': '0.019', 'ARMOR': '0.034', 'weapon5': '0.042', 'WEAPON5': '0.050', 'weapon4': '0.086', 'AMMO4': '0.093', 'HITCOUNT': '0.140', 'AMMO3': '0.150', 'WEAPON4': '0.150', 'weapon3': '0.446', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.650', 'weapon2': '1.598'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:02,306][63735] DAMAGECOUNT value on done: 225.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:02,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11264.0, 300 sec: 10762.6). Total num frames: 1560576. Throughput: 0: 1161.2, 1: 1641.8. Samples: 383534. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:02,460][109198] Avg episode reward: [(0, '-6.802'), (1, '-6.730')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:02,896][63767] DAMAGECOUNT value on done: 293.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:03,214][63767] DAMAGECOUNT value on done: 389.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:03,306][63734] DAMAGECOUNT value on done: 630.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:03,399][63733] Updated weights for policy 1, policy_version 210 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:03,407][63805] DAMAGECOUNT value on done: 262.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:03,678][63734] DAMAGECOUNT value on done: 170.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:03,726][63805] DAMAGECOUNT value on done: 271.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:04,939][63771] DAMAGECOUNT value on done: 188.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:05,275][63767] DAMAGECOUNT value on done: 371.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:05,276][63767] Sum rewards: -6.189, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.010', 'FRAGCOUNT': '-0.500', 'ARMOR': '0.004', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO2': '0.023', 'weapon5': '0.032', 'HITCOUNT': '0.080', 'AMMO3': '0.093', 'AMMO4': '0.113', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.228', 'WEAPON4': '0.250', 'weapon4': '0.368', 'WEAPON3': '0.500', 'weapon3': '0.654', 'weapon2': '1.054'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:05,323][63771] DAMAGECOUNT value on done: 322.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:05,323][63771] Sum rewards: -8.277, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.605', 'FRAGCOUNT': '-1.500', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'AMMO5': '0.003', 'ARMOR': '0.008', 'weapon5': '0.030', 'WEAPON5': '0.050', 'HITCOUNT': '0.080', 'AMMO3': '0.144', 'DAMAGECOUNT': '0.300', 'weapon3': '0.678', 'WEAPON3': '0.700', 'weapon2': '1.094'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:05,618][63767] DAMAGECOUNT value on done: 348.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:05,619][63767] Sum rewards: -4.488, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.822', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO4': '0.025', 'AMMO3': '0.050', 'WEAPON5': '0.050', 'ARMOR': '0.072', 'HITCOUNT': '0.080', 'WEAPON3': '0.250', 'DAMAGECOUNT': '0.255', 'weapon3': '0.636', 'FRAGCOUNT': '1.000', 'weapon2': '1.408'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:06,464][63769] DAMAGECOUNT value on done: 494.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:06,464][63769] Sum rewards: -2.672, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.505', 'AMMO2': '0.005', 'weapon4': '0.006', 'AMMO4': '0.025', 'ARMOR': '0.040', 'HITCOUNT': '0.050', 'WEAPON4': '0.050', 'AMMO3': '0.099', 'DAMAGECOUNT': '0.195', 'weapon3': '0.408', 'WEAPON3': '0.450', 'FRAGCOUNT': '1.000', 'weapon2': '1.504'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:06,694][63735] DAMAGECOUNT value on done: 337.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:06,785][63769] DAMAGECOUNT value on done: 209.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:07,092][63735] DAMAGECOUNT value on done: 323.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:07,223][63806] DAMAGECOUNT value on done: 430.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:07,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11264.0, 300 sec: 10786.1). Total num frames: 1617920. Throughput: 0: 1145.0, 1: 1658.7. Samples: 400651. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:07,460][109198] Avg episode reward: [(0, '-6.800'), (1, '-6.742')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:07,517][63806] DAMAGECOUNT value on done: 397.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:07,517][63806] Sum rewards: -2.603, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.084', 'weapon4': '0.004', 'AMMO2': '0.017', 'HITCOUNT': '0.050', 'ARMOR': '0.056', 'AMMO4': '0.085', 'weapon7': '0.086', 'AMMO3': '0.113', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.150', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.468', 'WEAPON3': '0.600', 'weapon2': '0.910', 'FRAGCOUNT': '1.000', 'weapon3': '1.002'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:07,563][63806] DAMAGECOUNT value on done: 251.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:07,564][63806] Sum rewards: -6.511, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.510', 'AMMO2': '0.003', 'AMMO5': '0.005', 'AMMO4': '0.013', 'HITCOUNT': '0.070', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.106', 'AMMO3': '0.129', 'DAMAGECOUNT': '0.345', 'ARMOR': '0.498', 'WEAPON3': '0.650', 'weapon3': '0.902', 'FRAGCOUNT': '1.000', 'weapon2': '1.078'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:07,733][63770] DAMAGECOUNT value on done: 205.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:07,916][63732] Updated weights for policy 0, policy_version 180 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:07,947][63734] DAMAGECOUNT value on done: 270.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:07,957][63806] DAMAGECOUNT value on done: 563.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:07,958][63806] Sum rewards: -4.806, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.602', 'weapon5': '0.006', 'AMMO5': '0.013', 'AMMO2': '0.023', 'HITCOUNT': '0.090', 'AMMO4': '0.116', 'AMMO3': '0.161', 'weapon4': '0.206', 'WEAPON5': '0.250', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.405', 'ARMOR': '0.436', 'WEAPON3': '0.800', 'weapon3': '0.800', 'weapon2': '0.940', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:08,129][63770] DAMAGECOUNT value on done: 320.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:08,129][63770] Sum rewards: -5.319, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.232', 'HITCOUNT': '0.010', 'DAMAGECOUNT': '0.015', 'AMMO2': '0.019', 'ARMOR': '0.044', 'AMMO4': '0.095', 'AMMO3': '0.131', 'weapon4': '0.172', 'WEAPON4': '0.250', 'WEAPON3': '0.600', 'weapon3': '0.624', 'FRAGCOUNT': '1.000', 'weapon2': '1.202'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:08,348][63734] DAMAGECOUNT value on done: 227.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:08,348][63734] Sum rewards: -3.605, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.098', 'AMMO5': '0.003', 'weapon5': '0.014', 'AMMO2': '0.019', 'HITCOUNT': '0.050', 'WEAPON5': '0.050', 'ARMOR': '0.072', 'AMMO3': '0.081', 'AMMO4': '0.096', 'DAMAGECOUNT': '0.150', 'WEAPON4': '0.200', 'weapon4': '0.268', 'WEAPON3': '0.400', 'weapon3': '0.736', 'weapon2': '0.854', 'FRAGCOUNT': '1.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:08,441][63771] DAMAGECOUNT value on done: 443.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:08,820][63771] DAMAGECOUNT value on done: 328.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:09,302][63770] DAMAGECOUNT value on done: 121.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:09,472][63769] DAMAGECOUNT value on done: 434.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:09,564][63733] Updated weights for policy 1, policy_version 220 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:09,698][63770] DAMAGECOUNT value on done: 333.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:09,893][63769] DAMAGECOUNT value on done: 170.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:11,945][63805] DAMAGECOUNT value on done: 380.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:12,346][63805] DAMAGECOUNT value on done: 552.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:12,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11195.8, 300 sec: 10781.7). Total num frames: 1671168. Throughput: 0: 1144.6, 1: 1655.9. Samples: 417357. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:12,459][109198] Avg episode reward: [(0, '-6.705'), (1, '-6.626')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:12,461][63576] Saving new best policy, reward=-6.626!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:15,734][63733] Updated weights for policy 1, policy_version 230 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:16,870][63732] Updated weights for policy 0, policy_version 190 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:17,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11264.0, 300 sec: 10803.2). Total num frames: 1728512. Throughput: 0: 1151.5, 1: 1666.9. Samples: 425979. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:17,460][109198] Avg episode reward: [(0, '-6.705'), (1, '-6.626')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:21,814][63733] Updated weights for policy 1, policy_version 240 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:22,458][109198] Fps is (10 sec: 11878.4, 60 sec: 11264.0, 300 sec: 10848.2). Total num frames: 1789952. Throughput: 0: 1156.5, 1: 1669.9. Samples: 443005. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:22,460][109198] Avg episode reward: [(0, '-6.705'), (1, '-6.626')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:23,971][63735] DAMAGECOUNT value on done: 380.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:24,319][63735] DAMAGECOUNT value on done: 272.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:25,167][63771] Large shaping reward -2.534 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.28500000000000003, -95.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:25,180][63767] DAMAGECOUNT value on done: 352.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:25,181][63767] Sum rewards: -2.168, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.642', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'HITCOUNT': '0.060', 'AMMO3': '0.120', 'DAMAGECOUNT': '0.177', 'ARMOR': '0.420', 'WEAPON3': '0.600', 'weapon3': '0.902', 'FRAGCOUNT': '1.000', 'weapon2': '1.196'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:25,509][63767] DAMAGECOUNT value on done: 532.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:25,510][63767] Sum rewards: -9.286, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.160', 'AMMO2': '0.016', 'ARMOR': '0.021', 'HITCOUNT': '0.070', 'AMMO4': '0.079', 'weapon4': '0.112', 'AMMO3': '0.131', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.429', 'weapon3': '0.624', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.292'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:25,679][63732] Updated weights for policy 0, policy_version 200 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:26,858][63805] DAMAGECOUNT value on done: 415.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:27,049][63734] DAMAGECOUNT value on done: 653.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:27,198][63805] DAMAGECOUNT value on done: 306.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:27,199][63805] Sum rewards: -4.060, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.580', 'WEAPON1': '0.010', 'AMMO2': '0.012', 'weapon5': '0.020', 'AMMO5': '0.022', 'weapon4': '0.026', 'HITCOUNT': '0.030', 'WEAPON4': '0.050', 'AMMO3': '0.059', 'AMMO4': '0.061', 'DAMAGECOUNT': '0.105', 'WEAPON3': '0.300', 'WEAPON5': '0.350', 'weapon3': '0.360', 'FRAGCOUNT': '1.000', 'weapon2': '1.614'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:27,458][109198] Fps is (10 sec: 11878.3, 60 sec: 11332.2, 300 sec: 10866.5). Total num frames: 1847296. Throughput: 0: 1158.6, 1: 1673.5. Samples: 459851. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:27,460][109198] Avg episode reward: [(0, '-6.721'), (1, '-6.617')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:27,465][63576] Saving new best policy, reward=-6.617!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:27,477][63734] DAMAGECOUNT value on done: 200.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:27,932][63733] Updated weights for policy 1, policy_version 250 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:28,279][63767] DAMAGECOUNT value on done: 411.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:28,280][63767] Sum rewards: -5.215, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.984', 'AMMO2': '0.005', 'AMMO5': '0.009', 'weapon5': '0.016', 'WEAPON1': '0.020', 'AMMO4': '0.024', 'HITCOUNT': '0.040', 'weapon4': '0.086', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.120', 'AMMO3': '0.158', 'WEAPON5': '0.200', 'ARMOR': '0.470', 'WEAPON3': '0.850', 'weapon3': '0.870', 'FRAGCOUNT': '1.000', 'weapon2': '1.050'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:28,619][63771] DAMAGECOUNT value on done: 253.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:28,678][63767] DAMAGECOUNT value on done: 483.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:28,679][63767] Sum rewards: -6.509, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.827', 'AMMO2': '0.016', 'AMMO4': '0.078', 'HITCOUNT': '0.080', 'AMMO3': '0.130', 'WEAPON4': '0.150', 'weapon4': '0.390', 'DAMAGECOUNT': '0.405', 'ARMOR': '0.469', 'weapon3': '0.546', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.154'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:28,971][63771] DAMAGECOUNT value on done: 432.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:28,971][63771] Sum rewards: -12.244, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-2.820', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.009', 'AMMO2': '0.011', 'weapon5': '0.012', 'weapon4': '0.022', 'AMMO4': '0.056', 'HITCOUNT': '0.070', 'WEAPON4': '0.100', 'AMMO3': '0.139', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.330', 'weapon3': '0.472', 'WEAPON3': '0.750', 'ARMOR': '0.910', 'weapon2': '1.494'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:29,854][63769] DAMAGECOUNT value on done: 494.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:30,179][63769] DAMAGECOUNT value on done: 290.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:30,179][63769] Sum rewards: -6.576, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.086', 'weapon5': '0.002', 'AMMO5': '0.005', 'AMMO2': '0.013', 'AMMO4': '0.064', 'AMMO3': '0.065', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.110', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.243', 'WEAPON3': '0.350', 'weapon3': '0.604', 'FRAGCOUNT': '1.000', 'weapon2': '1.404'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:30,487][63770] DAMAGECOUNT value on done: 205.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:30,488][63770] Sum rewards: -6.232, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.070', 'AMMO5': '0.009', 'AMMO2': '0.016', 'weapon5': '0.028', 'AMMO4': '0.079', 'weapon4': '0.088', 'WEAPON5': '0.100', 'AMMO3': '0.127', 'WEAPON4': '0.200', 'WEAPON3': '0.700', 'weapon3': '0.742', 'weapon2': '0.998'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:30,847][63770] DAMAGECOUNT value on done: 325.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:31,136][63735] DAMAGECOUNT value on done: 410.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:31,483][63735] DAMAGECOUNT value on done: 367.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:31,483][63735] Sum rewards: -7.312, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.316', 'AMMO2': '0.001', 'AMMO5': '0.003', 'AMMO4': '0.007', 'weapon5': '0.010', 'HITCOUNT': '0.050', 'WEAPON5': '0.050', 'ARMOR': '0.056', 'weapon4': '0.094', 'WEAPON4': '0.100', 'AMMO3': '0.103', 'DAMAGECOUNT': '0.132', 'WEAPON3': '0.350', 'weapon3': '0.410', 'weapon2': '1.638'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:31,698][63806] DAMAGECOUNT value on done: 676.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:32,036][63806] DAMAGECOUNT value on done: 416.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:32,079][63806] DAMAGECOUNT value on done: 266.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:32,434][63806] DAMAGECOUNT value on done: 563.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:32,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11332.3, 300 sec: 10860.3). Total num frames: 1900544. Throughput: 0: 1159.1, 1: 1672.1. Samples: 468321. Policy #0 lag: (min: 0.0, avg: 0.3, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:32,460][109198] Avg episode reward: [(0, '-6.668'), (1, '-6.367')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:32,461][63576] Saving new best policy, reward=-6.367!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:32,946][63769] DAMAGECOUNT value on done: 434.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:33,242][63734] DAMAGECOUNT value on done: 311.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:33,242][63734] Sum rewards: -1.769, reward structure: {'DEATHCOUNT': '-6.000', 'weapon7': '0.008', 'AMMO2': '0.025', 'weapon4': '0.042', 'HEALTH': '0.044', 'HITCOUNT': '0.050', 'AMMO3': '0.056', 'ARMOR': '0.056', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'DAMAGECOUNT': '0.123', 'AMMO4': '0.126', 'WEAPON4': '0.200', 'WEAPON3': '0.250', 'weapon3': '0.856', 'FRAGCOUNT': '1.000', 'weapon2': '1.094'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:33,267][63769] DAMAGECOUNT value on done: 227.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:33,268][63769] Sum rewards: -9.022, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.984', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'weapon5': '0.016', 'AMMO2': '0.039', 'HITCOUNT': '0.050', 'WEAPON5': '0.150', 'AMMO3': '0.159', 'DAMAGECOUNT': '0.171', 'weapon4': '0.190', 'AMMO4': '0.194', 'WEAPON4': '0.400', 'WEAPON3': '0.850', 'weapon3': '0.910', 'weapon2': '1.066'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:33,409][63771] DAMAGECOUNT value on done: 472.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:33,667][63734] DAMAGECOUNT value on done: 227.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:33,842][63771] DAMAGECOUNT value on done: 347.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:33,842][63771] Sum rewards: -2.550, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.374', 'HITCOUNT': '0.020', 'AMMO2': '0.040', 'DAMAGECOUNT': '0.057', 'AMMO3': '0.093', 'ARMOR': '0.136', 'AMMO4': '0.201', 'WEAPON3': '0.500', 'WEAPON4': '0.550', 'weapon3': '0.568', 'weapon4': '0.638', 'FRAGCOUNT': '1.000', 'weapon2': '1.020'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:34,049][63733] Updated weights for policy 1, policy_version 260 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:34,196][63770] DAMAGECOUNT value on done: 231.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:34,196][63770] Sum rewards: -2.723, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.720', 'AMMO2': '0.003', 'AMMO5': '0.010', 'AMMO4': '0.015', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'weapon5': '0.054', 'HITCOUNT': '0.060', 'AMMO3': '0.105', 'weapon4': '0.106', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.450', 'weapon3': '0.730', 'weapon2': '0.914', 'FRAGCOUNT': '1.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:34,556][63732] Updated weights for policy 0, policy_version 210 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:34,608][63770] DAMAGECOUNT value on done: 474.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:34,609][63770] Sum rewards: -7.619, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.182', 'AMMO2': '0.021', 'ARMOR': '0.032', 'AMMO4': '0.103', 'HITCOUNT': '0.130', 'AMMO3': '0.152', 'WEAPON4': '0.200', 'weapon4': '0.312', 'DAMAGECOUNT': '0.423', 'weapon3': '0.682', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.008'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:36,710][63805] DAMAGECOUNT value on done: 435.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:37,109][63805] DAMAGECOUNT value on done: 596.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:37,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11332.3, 300 sec: 10877.2). Total num frames: 1957888. Throughput: 0: 1158.8, 1: 1674.4. Samples: 485388. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:37,460][109198] Avg episode reward: [(0, '-6.551'), (1, '-6.275')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:37,466][63576] Saving new best policy, reward=-6.275!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:40,288][63733] Updated weights for policy 1, policy_version 270 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:42,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11264.0, 300 sec: 10871.0). Total num frames: 2011136. Throughput: 0: 1156.1, 1: 1666.7. Samples: 502016. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:42,460][109198] Avg episode reward: [(0, '-6.551'), (1, '-6.275')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:43,408][63732] Updated weights for policy 0, policy_version 220 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:46,457][63733] Updated weights for policy 1, policy_version 280 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:46,470][63735] DAMAGECOUNT value on done: 399.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:46,797][63735] DAMAGECOUNT value on done: 287.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:47,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11332.3, 300 sec: 10886.8). Total num frames: 2068480. Throughput: 0: 1154.7, 1: 1665.0. Samples: 510420. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:47,460][109198] Avg episode reward: [(0, '-6.553'), (1, '-6.275')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:47,583][63767] DAMAGECOUNT value on done: 437.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:47,584][63767] Sum rewards: -8.293, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.980', 'FRAGCOUNT': '-1.500', 'AMMO2': '0.013', 'AMMO5': '0.019', 'weapon5': '0.052', 'AMMO4': '0.064', 'HITCOUNT': '0.090', 'ARMOR': '0.095', 'AMMO3': '0.139', 'WEAPON4': '0.200', 'weapon4': '0.204', 'DAMAGECOUNT': '0.255', 'WEAPON5': '0.300', 'weapon2': '0.694', 'WEAPON3': '0.700', 'weapon3': '0.862'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:47,956][63767] DAMAGECOUNT value on done: 532.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:50,318][63805] DAMAGECOUNT value on done: 430.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:50,318][63805] Sum rewards: -9.257, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.062', 'FRAGCOUNT': '-1.500', 'weapon5': '0.010', 'AMMO5': '0.012', 'HITCOUNT': '0.020', 'AMMO2': '0.036', 'DAMAGECOUNT': '0.045', 'ARMOR': '0.064', 'AMMO3': '0.160', 'AMMO4': '0.178', 'WEAPON5': '0.250', 'WEAPON4': '0.450', 'weapon4': '0.458', 'weapon3': '0.670', 'WEAPON3': '0.800', 'weapon2': '0.902'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:50,645][63805] DAMAGECOUNT value on done: 306.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:51,078][63734] DAMAGECOUNT value on done: 678.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:51,480][63734] DAMAGECOUNT value on done: 370.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:51,481][63734] Sum rewards: -2.105, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO2': '0.019', 'AMMO4': '0.093', 'AMMO3': '0.098', 'HEALTH': '0.107', 'HITCOUNT': '0.130', 'WEAPON4': '0.150', 'weapon4': '0.214', 'ARMOR': '0.436', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.510', 'weapon3': '0.848', 'FRAGCOUNT': '1.000', 'weapon2': '1.290'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:51,674][63767] DAMAGECOUNT value on done: 611.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:51,674][63767] Sum rewards: -6.341, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.832', 'AMMO2': '0.008', 'weapon4': '0.018', 'ARMOR': '0.024', 'AMMO4': '0.038', 'WEAPON4': '0.100', 'AMMO3': '0.151', 'HITCOUNT': '0.190', 'DAMAGECOUNT': '0.600', 'WEAPON3': '0.850', 'weapon2': '1.150', 'weapon3': '1.362', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:52,083][63767] DAMAGECOUNT value on done: 543.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:52,084][63767] Sum rewards: -8.489, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.994', 'AMMO5': '0.003', 'weapon5': '0.010', 'AMMO2': '0.012', 'ARMOR': '0.016', 'weapon4': '0.020', 'WEAPON5': '0.050', 'AMMO4': '0.059', 'HITCOUNT': '0.080', 'WEAPON4': '0.100', 'AMMO3': '0.161', 'DAMAGECOUNT': '0.180', 'weapon3': '0.642', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.572'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:52,290][63771] DAMAGECOUNT value on done: 278.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:52,308][63732] Updated weights for policy 0, policy_version 230 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:52,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11332.3, 300 sec: 10901.7). Total num frames: 2125824. Throughput: 0: 1153.7, 1: 1662.7. Samples: 527387. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:52,460][109198] Avg episode reward: [(0, '-6.510'), (1, '-6.260')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:52,462][63576] Saving new best policy, reward=-6.260!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:52,648][63733] Updated weights for policy 1, policy_version 290 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:52,684][63771] DAMAGECOUNT value on done: 687.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:52,685][63771] Sum rewards: -6.425, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.572', 'AMMO5': '0.007', 'AMMO2': '0.017', 'ARMOR': '0.028', 'AMMO4': '0.086', 'AMMO3': '0.145', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'weapon4': '0.188', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.765', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.000', 'weapon3': '1.110'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:53,248][63770] DAMAGECOUNT value on done: 255.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:53,322][63769] DAMAGECOUNT value on done: 514.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:53,591][63770] DAMAGECOUNT value on done: 360.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:53,592][63770] Sum rewards: -10.518, reward structure: {'DEATHCOUNT': '-12.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.450', 'AMMO5': '0.009', 'AMMO2': '0.010', 'weapon5': '0.028', 'HITCOUNT': '0.030', 'weapon4': '0.034', 'AMMO4': '0.048', 'WEAPON4': '0.050', 'ARMOR': '0.056', 'DAMAGECOUNT': '0.105', 'WEAPON5': '0.150', 'AMMO3': '0.179', 'weapon3': '0.852', 'WEAPON3': '0.900', 'weapon2': '0.980'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:53,638][63769] DAMAGECOUNT value on done: 374.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:53,638][63769] Sum rewards: -5.648, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.260', 'AMMO5': '0.005', 'AMMO2': '0.019', 'weapon5': '0.030', 'HITCOUNT': '0.070', 'AMMO4': '0.092', 'WEAPON5': '0.100', 'AMMO3': '0.114', 'WEAPON4': '0.150', 'weapon4': '0.176', 'DAMAGECOUNT': '0.252', 'WEAPON3': '0.600', 'weapon3': '0.604', 'FRAGCOUNT': '1.000', 'weapon2': '1.150'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:55,748][63735] DAMAGECOUNT value on done: 522.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:55,748][63735] Sum rewards: -7.142, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.968', 'AMMO2': '0.007', 'AMMO5': '0.009', 'AMMO4': '0.034', 'HITCOUNT': '0.090', 'weapon5': '0.100', 'AMMO3': '0.124', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'weapon4': '0.232', 'DAMAGECOUNT': '0.336', 'WEAPON3': '0.450', 'weapon3': '0.484', 'FRAGCOUNT': '1.000', 'weapon2': '1.360'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:56,088][63806] DAMAGECOUNT value on done: 781.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:56,088][63806] Sum rewards: 0.056, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-0.443', 'AMMO4': '-0.021', 'AMMO2': '-0.004', 'ARMOR': '0.036', 'HITCOUNT': '0.060', 'AMMO3': '0.065', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.315', 'weapon3': '0.800', 'weapon2': '0.948', 'FRAGCOUNT': '1.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:56,143][63735] DAMAGECOUNT value on done: 487.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:56,143][63735] Sum rewards: -4.359, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.023', 'AMMO5': '0.004', 'AMMO2': '0.017', 'HITCOUNT': '0.060', 'AMMO4': '0.082', 'weapon5': '0.086', 'AMMO3': '0.099', 'WEAPON5': '0.100', 'ARMOR': '0.112', 'weapon4': '0.188', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.360', 'WEAPON3': '0.450', 'weapon3': '0.548', 'FRAGCOUNT': '1.000', 'weapon2': '1.058'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:56,359][63769] DAMAGECOUNT value on done: 504.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:56,455][63806] DAMAGECOUNT value on done: 416.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:56,506][63806] DAMAGECOUNT value on done: 316.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:56,720][63769] DAMAGECOUNT value on done: 267.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:56,864][63806] DAMAGECOUNT value on done: 597.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:56,864][63806] Sum rewards: -6.710, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.580', 'AMMO5': '0.005', 'AMMO2': '0.018', 'HITCOUNT': '0.040', 'ARMOR': '0.056', 'AMMO4': '0.091', 'DAMAGECOUNT': '0.102', 'weapon4': '0.110', 'AMMO3': '0.118', 'WEAPON4': '0.200', 'weapon3': '0.638', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.592'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:57,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11195.8, 300 sec: 10895.4). Total num frames: 2179072. Throughput: 0: 1153.9, 1: 1664.2. Samples: 544172. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:39:57,460][109198] Avg episode reward: [(0, '-6.524'), (1, '-6.236')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:57,466][63576] Saving new best policy, reward=-6.236!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:58,650][63771] DAMAGECOUNT value on done: 517.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:58,666][63734] DAMAGECOUNT value on done: 336.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:58,837][63733] Updated weights for policy 1, policy_version 300 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:59,050][63771] DAMAGECOUNT value on done: 402.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:59,063][63734] DAMAGECOUNT value on done: 294.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:59,063][63734] Sum rewards: -5.722, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.174', 'AMMO2': '0.006', 'AMMO5': '0.010', 'weapon5': '0.016', 'ARMOR': '0.028', 'AMMO4': '0.030', 'HITCOUNT': '0.070', 'AMMO3': '0.091', 'WEAPON4': '0.100', 'weapon4': '0.126', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.201', 'WEAPON3': '0.500', 'weapon3': '0.714', 'FRAGCOUNT': '1.000', 'weapon2': '1.410'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:59,134][63770] DAMAGECOUNT value on done: 241.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:39:59,563][63770] DAMAGECOUNT value on done: 534.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:01,235][63732] Updated weights for policy 0, policy_version 240 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:01,649][63805] DAMAGECOUNT value on done: 495.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:01,650][63805] Sum rewards: -4.256, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.045', 'AMMO5': '0.005', 'AMMO2': '0.021', 'WEAPON5': '0.050', 'ARMOR': '0.060', 'HITCOUNT': '0.060', 'weapon4': '0.062', 'AMMO3': '0.071', 'AMMO4': '0.106', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.180', 'WEAPON3': '0.350', 'weapon3': '0.422', 'FRAGCOUNT': '1.000', 'weapon2': '1.752'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:02,052][63805] DAMAGECOUNT value on done: 756.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:02,053][63805] Sum rewards: -8.149, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.190', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.013', 'weapon4': '0.020', 'ARMOR': '0.048', 'AMMO4': '0.063', 'weapon5': '0.068', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'WEAPON5': '0.150', 'AMMO3': '0.184', 'DAMAGECOUNT': '0.480', 'weapon3': '0.802', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.286'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:02,458][109198] Fps is (10 sec: 11059.0, 60 sec: 11264.0, 300 sec: 10909.4). Total num frames: 2236416. Throughput: 0: 1152.8, 1: 1663.9. Samples: 552730. Policy #0 lag: (min: 0.0, avg: 0.3, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:02,460][109198] Avg episode reward: [(0, '-6.463'), (1, '-6.344')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:04,909][63733] Updated weights for policy 1, policy_version 310 (0.0013)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:07,458][109198] Fps is (10 sec: 11878.2, 60 sec: 11332.2, 300 sec: 10942.2). Total num frames: 2297856. Throughput: 0: 1153.1, 1: 1664.0. Samples: 569776. Policy #0 lag: (min: 0.0, avg: 0.1, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:07,460][109198] Avg episode reward: [(0, '-6.463'), (1, '-6.344')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:08,537][63735] DAMAGECOUNT value on done: 524.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:08,538][63735] Sum rewards: -3.630, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO5': '0.003', 'AMMO2': '0.013', 'weapon5': '0.022', 'WEAPON5': '0.050', 'weapon4': '0.052', 'AMMO4': '0.067', 'AMMO3': '0.084', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'HEALTH': '0.290', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.450', 'weapon3': '0.932', 'FRAGCOUNT': '1.000', 'weapon2': '1.082'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:08,879][63735] DAMAGECOUNT value on done: 367.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:08,880][63735] Sum rewards: -4.753, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.262', 'AMMO5': '0.009', 'AMMO2': '0.026', 'ARMOR': '0.044', 'HITCOUNT': '0.050', 'weapon5': '0.050', 'weapon4': '0.052', 'AMMO3': '0.083', 'AMMO4': '0.130', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.240', 'WEAPON3': '0.400', 'weapon3': '0.786', 'FRAGCOUNT': '1.000', 'weapon2': '1.238'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:09,155][63767] Large shaping reward -2.549 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.3, -100.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:09,852][63767] DAMAGECOUNT value on done: 437.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:10,008][63732] Updated weights for policy 0, policy_version 250 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:10,235][63767] DAMAGECOUNT value on done: 627.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:10,236][63767] Sum rewards: -11.783, reward structure: {'DEATHCOUNT': '-10.500', 'FRAGCOUNT': '-3.000', 'HEALTH': '-1.900', 'AMMO4': '-0.040', 'AMMO2': '-0.008', 'AMMO5': '0.007', 'weapon5': '0.014', 'ARMOR': '0.036', 'HITCOUNT': '0.080', 'WEAPON5': '0.150', 'AMMO3': '0.170', 'DAMAGECOUNT': '0.285', 'WEAPON3': '0.750', 'weapon3': '0.850', 'weapon2': '1.322'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:10,990][63733] Updated weights for policy 1, policy_version 320 (0.0013)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:12,458][109198] Fps is (10 sec: 11469.0, 60 sec: 11332.3, 300 sec: 10935.4). Total num frames: 2351104. Throughput: 0: 1155.2, 1: 1668.0. Samples: 586898. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:12,460][109198] Avg episode reward: [(0, '-6.447'), (1, '-6.344')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:13,674][63805] DAMAGECOUNT value on done: 430.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:14,061][63805] DAMAGECOUNT value on done: 538.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:14,665][63734] DAMAGECOUNT value on done: 754.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:14,666][63734] Sum rewards: 0.013, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.462', 'AMMO5': '0.003', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'weapon5': '0.038', 'weapon7': '0.042', 'WEAPON5': '0.050', 'ARMOR': '0.052', 'AMMO3': '0.070', 'HITCOUNT': '0.090', 'AMMO4': '0.092', 'WEAPON4': '0.150', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.228', 'WEAPON3': '0.400', 'weapon4': '0.420', 'weapon3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.032'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:14,719][63767] DAMAGECOUNT value on done: 716.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:14,720][63767] Sum rewards: -0.510, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.439', 'AMMO2': '0.021', 'AMMO3': '0.092', 'AMMO4': '0.106', 'HITCOUNT': '0.120', 'WEAPON4': '0.200', 'weapon4': '0.212', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.450', 'weapon2': '1.034', 'weapon3': '1.128', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:15,015][63734] DAMAGECOUNT value on done: 505.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:15,016][63734] Sum rewards: -6.053, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.688', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'AMMO2': '0.022', 'weapon5': '0.024', 'ARMOR': '0.060', 'HITCOUNT': '0.080', 'AMMO4': '0.109', 'WEAPON5': '0.150', 'AMMO3': '0.159', 'WEAPON4': '0.200', 'weapon4': '0.234', 'DAMAGECOUNT': '0.405', 'weapon3': '0.660', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.452'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:15,066][63767] DAMAGECOUNT value on done: 751.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:15,066][63767] Sum rewards: -2.996, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.042', 'AMMO5': '0.010', 'AMMO2': '0.040', 'AMMO3': '0.078', 'HITCOUNT': '0.080', 'weapon5': '0.144', 'weapon4': '0.176', 'AMMO4': '0.198', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'weapon3': '0.298', 'WEAPON3': '0.400', 'ARMOR': '0.432', 'DAMAGECOUNT': '0.624', 'FRAGCOUNT': '1.000', 'weapon2': '1.366'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:15,876][63770] DAMAGECOUNT value on done: 279.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:15,876][63770] Sum rewards: -4.207, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.430', 'AMMO5': '0.005', 'AMMO2': '0.011', 'weapon5': '0.018', 'WEAPON1': '0.020', 'HITCOUNT': '0.030', 'ARMOR': '0.040', 'AMMO4': '0.057', 'AMMO3': '0.072', 'DAMAGECOUNT': '0.072', 'WEAPON5': '0.100', 'weapon4': '0.136', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon3': '0.510', 'FRAGCOUNT': '1.000', 'weapon2': '1.302'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:15,931][63771] DAMAGECOUNT value on done: 298.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:16,250][63771] DAMAGECOUNT value on done: 766.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:16,252][63770] DAMAGECOUNT value on done: 370.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:16,511][63769] DAMAGECOUNT value on done: 564.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:16,843][63769] DAMAGECOUNT value on done: 489.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:16,844][63769] Sum rewards: -6.617, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.900', 'AMMO5': '0.005', 'AMMO2': '0.019', 'weapon5': '0.040', 'HITCOUNT': '0.070', 'AMMO4': '0.092', 'WEAPON5': '0.100', 'AMMO3': '0.119', 'WEAPON4': '0.150', 'weapon4': '0.158', 'DAMAGECOUNT': '0.345', 'WEAPON3': '0.650', 'weapon3': '0.718', 'FRAGCOUNT': '1.000', 'weapon2': '1.568'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:17,059][63733] Updated weights for policy 1, policy_version 330 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:17,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11332.2, 300 sec: 10947.5). Total num frames: 2408448. Throughput: 0: 1155.1, 1: 1666.9. Samples: 595314. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:17,460][109198] Avg episode reward: [(0, '-6.462'), (1, '-6.185')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:17,468][63576] Saving new best policy, reward=-6.185!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:18,824][63732] Updated weights for policy 0, policy_version 260 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:19,598][63769] DAMAGECOUNT value on done: 549.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:19,599][63769] Sum rewards: -5.427, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-0.500', 'HEALTH': '-0.076', 'AMMO5': '0.003', 'weapon5': '0.006', 'AMMO2': '0.020', 'WEAPON5': '0.050', 'HITCOUNT': '0.050', 'AMMO4': '0.098', 'AMMO3': '0.115', 'DAMAGECOUNT': '0.135', 'ARMOR': '0.400', 'WEAPON3': '0.650', 'weapon2': '1.156', 'weapon3': '1.466'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:19,928][63769] DAMAGECOUNT value on done: 295.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:19,992][63735] DAMAGECOUNT value on done: 641.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:19,993][63735] Sum rewards: 0.354, reward structure: {'DEATHCOUNT': '-3.750', 'HEALTH': '-0.090', 'AMMO4': '-0.021', 'AMMO2': '-0.004', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'ARMOR': '0.028', 'WEAPON5': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.080', 'WEAPON3': '0.250', 'DAMAGECOUNT': '0.357', 'weapon3': '0.974', 'FRAGCOUNT': '1.000', 'weapon2': '1.400'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:20,376][63735] DAMAGECOUNT value on done: 662.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:20,377][63735] Sum rewards: -1.505, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.570', 'AMMO2': '0.008', 'AMMO5': '0.010', 'HITCOUNT': '0.040', 'AMMO4': '0.041', 'WEAPON4': '0.050', 'weapon4': '0.056', 'weapon5': '0.088', 'WEAPON5': '0.100', 'AMMO3': '0.104', 'WEAPON3': '0.350', 'ARMOR': '0.400', 'DAMAGECOUNT': '0.525', 'weapon3': '0.612', 'weapon2': '1.430', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:20,565][63806] DAMAGECOUNT value on done: 926.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:20,566][63806] Sum rewards: -5.633, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.638', 'AMMO5': '0.005', 'weapon5': '0.008', 'AMMO2': '0.024', 'ARMOR': '0.076', 'weapon4': '0.080', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO4': '0.117', 'AMMO3': '0.120', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.550', 'weapon3': '0.610', 'FRAGCOUNT': '1.000', 'weapon2': '1.430'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:20,952][63806] DAMAGECOUNT value on done: 561.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:20,952][63806] Sum rewards: -7.367, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.822', 'ARMOR': '0.010', 'AMMO2': '0.021', 'HITCOUNT': '0.100', 'AMMO4': '0.107', 'weapon4': '0.124', 'AMMO3': '0.148', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.435', 'weapon3': '0.552', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.408'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:20,998][63806] DAMAGECOUNT value on done: 406.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:20,998][63806] Sum rewards: -3.244, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.744', 'weapon5': '0.002', 'AMMO5': '0.003', 'AMMO2': '0.027', 'WEAPON5': '0.050', 'ARMOR': '0.064', 'HITCOUNT': '0.070', 'AMMO3': '0.114', 'AMMO4': '0.132', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.270', 'weapon4': '0.402', 'WEAPON3': '0.650', 'weapon2': '0.970', 'weapon3': '0.996', 'FRAGCOUNT': '1.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:21,373][63806] DAMAGECOUNT value on done: 618.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:21,374][63806] Sum rewards: -9.688, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-0.914', 'AMMO5': '0.003', 'HITCOUNT': '0.020', 'WEAPON1': '0.020', 'AMMO2': '0.021', 'ARMOR': '0.041', 'WEAPON5': '0.050', 'DAMAGECOUNT': '0.063', 'weapon4': '0.104', 'AMMO4': '0.106', 'AMMO3': '0.122', 'WEAPON4': '0.200', 'WEAPON3': '0.650', 'weapon3': '0.840', 'FRAGCOUNT': '1.000', 'weapon2': '1.486'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:22,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11264.0, 300 sec: 10959.1). Total num frames: 2465792. Throughput: 0: 1155.4, 1: 1666.4. Samples: 612369. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:22,460][109198] Avg episode reward: [(0, '-6.412'), (1, '-6.070')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:22,461][63576] Saving new best policy, reward=-6.070!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:23,181][63733] Updated weights for policy 1, policy_version 340 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:23,517][63771] DAMAGECOUNT value on done: 587.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:23,518][63771] Sum rewards: -10.440, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-3.190', 'AMMO2': '0.006', 'ARMOR': '0.032', 'AMMO4': '0.032', 'weapon4': '0.034', 'HITCOUNT': '0.080', 'WEAPON4': '0.100', 'AMMO3': '0.207', 'DAMAGECOUNT': '0.210', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon3': '1.022', 'weapon2': '1.126'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:23,546][63734] DAMAGECOUNT value on done: 486.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:23,546][63734] Sum rewards: -7.179, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.364', 'AMMO5': '0.003', 'AMMO2': '0.010', 'WEAPON1': '0.020', 'HITCOUNT': '0.040', 'weapon4': '0.042', 'AMMO4': '0.052', 'WEAPON5': '0.100', 'weapon5': '0.106', 'AMMO3': '0.124', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.550', 'weapon3': '0.606', 'FRAGCOUNT': '1.000', 'weapon2': '1.432'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:23,900][63771] DAMAGECOUNT value on done: 472.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:23,936][63734] DAMAGECOUNT value on done: 328.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:23,937][63734] Sum rewards: -7.742, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.742', 'AMMO2': '0.017', 'HITCOUNT': '0.030', 'weapon4': '0.064', 'AMMO4': '0.083', 'AMMO3': '0.100', 'DAMAGECOUNT': '0.102', 'WEAPON4': '0.150', 'WEAPON3': '0.500', 'weapon3': '0.990', 'FRAGCOUNT': '1.000', 'weapon2': '1.464'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:24,152][63770] DAMAGECOUNT value on done: 257.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:24,566][63770] DAMAGECOUNT value on done: 549.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:26,554][63805] DAMAGECOUNT value on done: 529.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:26,554][63805] Sum rewards: -9.187, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.190', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.007', 'AMMO2': '0.011', 'weapon5': '0.012', 'WEAPON1': '0.020', 'HITCOUNT': '0.030', 'weapon4': '0.036', 'ARMOR': '0.040', 'AMMO4': '0.054', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.102', 'AMMO3': '0.193', 'weapon3': '0.786', 'WEAPON3': '0.900', 'weapon2': '1.362'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:26,969][63805] DAMAGECOUNT value on done: 1022.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:26,969][63805] Sum rewards: -3.183, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.892', 'AMMO5': '0.010', 'AMMO2': '0.014', 'ARMOR': '0.024', 'weapon5': '0.052', 'AMMO4': '0.071', 'WEAPON5': '0.100', 'AMMO3': '0.150', 'WEAPON4': '0.150', 'HITCOUNT': '0.170', 'weapon4': '0.288', 'DAMAGECOUNT': '0.798', 'WEAPON3': '0.850', 'weapon2': '0.952', 'weapon3': '1.080', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:27,458][109198] Fps is (10 sec: 11059.4, 60 sec: 11195.8, 300 sec: 10952.4). Total num frames: 2519040. Throughput: 0: 1156.7, 1: 1672.6. Samples: 629337. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:27,460][109198] Avg episode reward: [(0, '-6.440'), (1, '-6.055')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:27,465][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000269_1101824.pth...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:27,518][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000347_1421312.pth...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:27,574][63576] Saving new best policy, reward=-6.055!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:27,770][63732] Updated weights for policy 0, policy_version 270 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:29,360][63733] Updated weights for policy 1, policy_version 350 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:30,529][63735] DAMAGECOUNT value on done: 575.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:30,899][63735] DAMAGECOUNT value on done: 576.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:30,899][63735] Sum rewards: -5.638, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.396', 'AMMO2': '0.017', 'ARMOR': '0.071', 'AMMO4': '0.083', 'weapon4': '0.086', 'AMMO3': '0.180', 'WEAPON4': '0.200', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.627', 'weapon3': '0.942', 'WEAPON3': '1.000', 'weapon2': '1.092', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:32,310][63767] DAMAGECOUNT value on done: 482.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:32,310][63767] Sum rewards: -8.822, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.486', 'AMMO2': '0.021', 'HITCOUNT': '0.040', 'weapon4': '0.046', 'AMMO4': '0.103', 'ARMOR': '0.108', 'DAMAGECOUNT': '0.135', 'WEAPON4': '0.150', 'AMMO3': '0.203', 'weapon3': '0.624', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.284'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:32,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11332.3, 300 sec: 10980.8). Total num frames: 2580480. Throughput: 0: 1157.5, 1: 1672.8. Samples: 637784. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:32,460][109198] Avg episode reward: [(0, '-6.341'), (1, '-6.055')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:32,623][63767] DAMAGECOUNT value on done: 682.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:32,624][63767] Sum rewards: -6.076, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.830', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'AMMO5': '0.003', 'HITCOUNT': '0.050', 'AMMO3': '0.132', 'DAMAGECOUNT': '0.165', 'ARMOR': '0.487', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.096', 'weapon2': '1.152'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:35,054][63733] Updated weights for policy 1, policy_version 360 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:37,053][63805] DAMAGECOUNT value on done: 455.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:37,433][63805] DAMAGECOUNT value on done: 578.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:37,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11264.0, 300 sec: 10973.9). Total num frames: 2633728. Throughput: 0: 1136.1, 1: 1695.4. Samples: 654803. Policy #0 lag: (min: 0.0, avg: 0.1, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:37,460][109198] Avg episode reward: [(0, '-6.350'), (1, '-6.095')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:37,595][63732] Updated weights for policy 0, policy_version 280 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:37,985][63767] DAMAGECOUNT value on done: 931.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:37,986][63767] Sum rewards: -2.765, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.392', 'AMMO5': '0.007', 'AMMO2': '0.009', 'ARMOR': '0.009', 'weapon5': '0.010', 'weapon4': '0.022', 'AMMO4': '0.042', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'AMMO3': '0.130', 'HITCOUNT': '0.130', 'DAMAGECOUNT': '0.645', 'WEAPON3': '0.750', 'weapon2': '0.920', 'weapon3': '1.552', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:38,284][63770] DAMAGECOUNT value on done: 299.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:38,377][63734] DAMAGECOUNT value on done: 824.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:38,383][63767] DAMAGECOUNT value on done: 830.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:38,383][63767] Sum rewards: -5.861, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.986', 'AMMO2': '0.018', 'HITCOUNT': '0.070', 'ARMOR': '0.072', 'AMMO4': '0.087', 'AMMO3': '0.127', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.237', 'weapon4': '0.272', 'WEAPON3': '0.650', 'weapon3': '0.896', 'FRAGCOUNT': '1.000', 'weapon2': '1.246'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:38,639][63770] DAMAGECOUNT value on done: 396.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:38,756][63734] DAMAGECOUNT value on done: 561.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:38,757][63734] Sum rewards: -5.827, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.650', 'AMMO5': '0.004', 'AMMO2': '0.009', 'ARMOR': '0.035', 'weapon5': '0.038', 'AMMO4': '0.043', 'HITCOUNT': '0.050', 'AMMO3': '0.088', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.168', 'WEAPON4': '0.200', 'weapon4': '0.252', 'WEAPON3': '0.500', 'weapon3': '0.998', 'FRAGCOUNT': '1.000', 'weapon2': '1.338'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:39,462][63771] DAMAGECOUNT value on done: 408.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:39,814][63771] DAMAGECOUNT value on done: 826.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:39,814][63771] Sum rewards: -4.640, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.456', 'AMMO5': '0.005', 'AMMO2': '0.009', 'WEAPON1': '0.020', 'weapon5': '0.022', 'AMMO4': '0.045', 'HITCOUNT': '0.050', 'AMMO3': '0.091', 'WEAPON5': '0.100', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.180', 'weapon4': '0.206', 'ARMOR': '0.476', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.020', 'weapon2': '1.142'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:39,938][63769] DAMAGECOUNT value on done: 597.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:40,342][63769] DAMAGECOUNT value on done: 509.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:40,714][63733] Updated weights for policy 1, policy_version 370 (0.0013)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:42,458][109198] Fps is (10 sec: 10649.6, 60 sec: 11264.0, 300 sec: 10967.3). Total num frames: 2686976. Throughput: 0: 1119.2, 1: 1709.9. Samples: 671481. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:42,460][109198] Avg episode reward: [(0, '-6.331'), (1, '-6.118')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:43,095][63769] DAMAGECOUNT value on done: 676.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:43,096][63769] Sum rewards: -4.532, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.450', 'AMMO5': '0.003', 'weapon5': '0.004', 'WEAPON1': '0.010', 'AMMO2': '0.028', 'weapon4': '0.032', 'WEAPON5': '0.050', 'ARMOR': '0.055', 'AMMO3': '0.095', 'HITCOUNT': '0.120', 'AMMO4': '0.139', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.381', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.036', 'weapon2': '1.266'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:43,421][63769] DAMAGECOUNT value on done: 339.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:44,410][63735] DAMAGECOUNT value on done: 696.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:44,743][63735] DAMAGECOUNT value on done: 677.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:45,183][63806] DAMAGECOUNT value on done: 926.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:45,540][63806] DAMAGECOUNT value on done: 621.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:45,583][63806] DAMAGECOUNT value on done: 472.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:45,894][63806] DAMAGECOUNT value on done: 663.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:46,785][63733] Updated weights for policy 1, policy_version 380 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:46,871][63732] Updated weights for policy 0, policy_version 290 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:47,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11332.3, 300 sec: 10993.7). Total num frames: 2748416. Throughput: 0: 1116.9, 1: 1709.4. Samples: 679913. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:47,460][109198] Avg episode reward: [(0, '-6.428'), (1, '-6.031')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:47,466][63576] Saving new best policy, reward=-6.031!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:48,580][63771] DAMAGECOUNT value on done: 692.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:48,581][63771] Sum rewards: -5.147, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.171', 'AMMO2': '0.024', 'AMMO3': '0.092', 'HITCOUNT': '0.110', 'AMMO4': '0.120', 'weapon4': '0.142', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.315', 'ARMOR': '0.472', 'WEAPON3': '0.500', 'weapon3': '0.762', 'FRAGCOUNT': '1.000', 'weapon2': '1.186'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:48,894][63734] DAMAGECOUNT value on done: 511.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:48,988][63771] DAMAGECOUNT value on done: 509.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:49,222][63770] DAMAGECOUNT value on done: 257.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:49,223][63770] Sum rewards: -9.235, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.799', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.007', 'AMMO2': '0.011', 'weapon5': '0.018', 'ARMOR': '0.044', 'weapon4': '0.050', 'AMMO4': '0.053', 'AMMO3': '0.127', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'weapon3': '0.598', 'WEAPON3': '0.600', 'weapon2': '1.256'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:49,317][63734] DAMAGECOUNT value on done: 578.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:49,318][63734] Sum rewards: -4.419, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.060', 'weapon5': '0.002', 'AMMO5': '0.007', 'AMMO2': '0.015', 'weapon4': '0.072', 'AMMO4': '0.073', 'ARMOR': '0.090', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.150', 'AMMO3': '0.183', 'DAMAGECOUNT': '0.750', 'WEAPON3': '0.950', 'weapon2': '1.230', 'weapon3': '1.418', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:49,655][63770] DAMAGECOUNT value on done: 648.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:51,529][63805] DAMAGECOUNT value on done: 550.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:51,920][63805] DAMAGECOUNT value on done: 1059.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:52,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11264.0, 300 sec: 10986.9). Total num frames: 2801664. Throughput: 0: 1139.4, 1: 1676.9. Samples: 696505. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:52,460][109198] Avg episode reward: [(0, '-6.432'), (1, '-6.015')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:52,462][63576] Saving new best policy, reward=-6.015!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:53,571][63735] DAMAGECOUNT value on done: 725.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:53,572][63735] Sum rewards: -6.895, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.770', 'AMMO2': '0.007', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO4': '0.035', 'ARMOR': '0.044', 'weapon5': '0.044', 'HITCOUNT': '0.100', 'AMMO3': '0.136', 'WEAPON4': '0.150', 'weapon4': '0.172', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.134', 'weapon2': '1.282'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:53,894][63735] DAMAGECOUNT value on done: 736.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:53,895][63735] Sum rewards: 0.413, reward structure: {'DEATHCOUNT': '-3.750', 'HEALTH': '-0.741', 'AMMO2': '0.015', 'ARMOR': '0.052', 'AMMO4': '0.076', 'AMMO3': '0.086', 'WEAPON4': '0.100', 'weapon4': '0.134', 'HITCOUNT': '0.160', 'DAMAGECOUNT': '0.480', 'WEAPON3': '0.500', 'weapon2': '0.852', 'FRAGCOUNT': '1.000', 'weapon3': '1.448'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:53,922][63732] Updated weights for policy 0, policy_version 300 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:54,157][63733] Updated weights for policy 1, policy_version 390 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:54,761][63767] DAMAGECOUNT value on done: 581.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:55,086][63767] DAMAGECOUNT value on done: 740.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:57,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11400.5, 300 sec: 11011.9). Total num frames: 2863104. Throughput: 0: 1196.7, 1: 1621.6. Samples: 713722. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:40:57,460][109198] Avg episode reward: [(0, '-6.524'), (1, '-5.934')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:40:57,467][63576] Saving new best policy, reward=-5.934!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:00,199][63732] Updated weights for policy 0, policy_version 310 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:00,260][63805] DAMAGECOUNT value on done: 571.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:00,656][63805] DAMAGECOUNT value on done: 733.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:00,656][63805] Sum rewards: -4.640, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.746', 'AMMO5': '0.005', 'AMMO2': '0.005', 'weapon5': '0.018', 'AMMO4': '0.026', 'weapon4': '0.070', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.120', 'AMMO3': '0.140', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.600', 'weapon3': '0.854', 'weapon2': '1.602', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:00,884][63767] DAMAGECOUNT value on done: 1256.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:00,884][63767] Sum rewards: -4.573, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.544', 'AMMO5': '0.003', 'AMMO2': '0.028', 'weapon5': '0.034', 'ARMOR': '0.037', 'WEAPON5': '0.050', 'weapon4': '0.092', 'AMMO3': '0.136', 'HITCOUNT': '0.140', 'AMMO4': '0.140', 'WEAPON4': '0.200', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.975', 'weapon2': '1.104', 'weapon3': '1.532'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:01,246][63767] DAMAGECOUNT value on done: 854.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:01,247][63767] Sum rewards: -6.743, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.834', 'AMMO2': '0.007', 'AMMO5': '0.007', 'weapon5': '0.026', 'HITCOUNT': '0.030', 'AMMO4': '0.035', 'ARMOR': '0.052', 'DAMAGECOUNT': '0.072', 'WEAPON4': '0.100', 'AMMO3': '0.129', 'WEAPON5': '0.150', 'weapon4': '0.312', 'WEAPON3': '0.700', 'weapon2': '0.874', 'weapon3': '1.346'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:01,359][63770] DAMAGECOUNT value on done: 401.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:01,359][63770] Sum rewards: -4.085, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.192', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'WEAPON4': '0.050', 'ARMOR': '0.052', 'weapon4': '0.072', 'HITCOUNT': '0.080', 'AMMO3': '0.140', 'DAMAGECOUNT': '0.306', 'WEAPON3': '0.650', 'weapon3': '0.664', 'weapon2': '1.344', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:01,737][63770] DAMAGECOUNT value on done: 491.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:01,737][63770] Sum rewards: -6.156, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.020', 'AMMO4': '-0.021', 'AMMO2': '-0.004', 'AMMO5': '0.005', 'weapon5': '0.020', 'HITCOUNT': '0.090', 'WEAPON5': '0.100', 'AMMO3': '0.164', 'DAMAGECOUNT': '0.285', 'WEAPON3': '0.850', 'weapon3': '0.952', 'FRAGCOUNT': '1.000', 'weapon2': '1.424'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:02,365][63733] Updated weights for policy 1, policy_version 400 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:02,458][109198] Fps is (10 sec: 11878.3, 60 sec: 11400.5, 300 sec: 11020.6). Total num frames: 2920448. Throughput: 0: 1228.8, 1: 1597.8. Samples: 722510. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:02,460][109198] Avg episode reward: [(0, '-6.489'), (1, '-5.849')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:02,461][63576] Saving new best policy, reward=-5.849!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:02,696][63771] DAMAGECOUNT value on done: 538.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:02,697][63771] Sum rewards: -4.509, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.420', 'AMMO2': '0.004', 'AMMO5': '0.010', 'weapon5': '0.010', 'AMMO4': '0.022', 'WEAPON4': '0.050', 'HITCOUNT': '0.080', 'WEAPON5': '0.100', 'weapon4': '0.108', 'AMMO3': '0.132', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.082', 'weapon3': '1.322'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:03,012][63771] DAMAGECOUNT value on done: 871.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:03,317][63769] DAMAGECOUNT value on done: 627.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:03,317][63769] Sum rewards: -8.132, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.500', 'AMMO5': '0.005', 'AMMO2': '0.026', 'HITCOUNT': '0.040', 'weapon5': '0.046', 'DAMAGECOUNT': '0.090', 'WEAPON5': '0.100', 'AMMO4': '0.130', 'AMMO3': '0.144', 'WEAPON3': '0.850', 'weapon2': '1.120', 'weapon3': '1.316'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:03,633][63769] DAMAGECOUNT value on done: 529.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:03,634][63769] Sum rewards: -5.408, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.848', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'HITCOUNT': '0.020', 'AMMO2': '0.035', 'ARMOR': '0.040', 'weapon5': '0.040', 'DAMAGECOUNT': '0.060', 'WEAPON5': '0.100', 'AMMO3': '0.113', 'weapon4': '0.120', 'AMMO4': '0.177', 'WEAPON4': '0.200', 'WEAPON3': '0.600', 'weapon2': '0.850', 'weapon3': '1.320'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:03,717][63734] DAMAGECOUNT value on done: 960.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:04,154][63734] DAMAGECOUNT value on done: 711.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:06,590][63732] Updated weights for policy 0, policy_version 320 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:07,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11332.3, 300 sec: 11028.9). Total num frames: 2977792. Throughput: 0: 1285.4, 1: 1540.8. Samples: 739547. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:07,460][109198] Avg episode reward: [(0, '-6.512'), (1, '-5.664')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:07,467][63576] Saving new best policy, reward=-5.664!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:07,652][63806] DAMAGECOUNT value on done: 983.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:07,652][63806] Sum rewards: -8.018, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.654', 'WEAPON1': '0.010', 'AMMO2': '0.039', 'ARMOR': '0.046', 'HITCOUNT': '0.080', 'AMMO3': '0.108', 'weapon4': '0.138', 'DAMAGECOUNT': '0.171', 'AMMO4': '0.194', 'WEAPON4': '0.350', 'WEAPON3': '0.450', 'weapon3': '0.782', 'FRAGCOUNT': '1.000', 'weapon2': '1.268'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:07,995][63806] DAMAGECOUNT value on done: 721.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:08,041][63806] DAMAGECOUNT value on done: 477.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:08,075][63769] DAMAGECOUNT value on done: 876.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:08,075][63769] Sum rewards: -0.375, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO2': '0.003', 'AMMO5': '0.005', 'ARMOR': '0.008', 'AMMO4': '0.013', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.097', 'WEAPON5': '0.100', 'weapon5': '0.138', 'HEALTH': '0.151', 'weapon4': '0.214', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.600', 'weapon3': '0.802', 'weapon2': '0.964', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:08,331][63806] DAMAGECOUNT value on done: 768.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:08,427][63769] DAMAGECOUNT value on done: 468.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:08,897][63735] DAMAGECOUNT value on done: 731.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:09,293][63735] DAMAGECOUNT value on done: 817.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:09,294][63735] Sum rewards: -5.902, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.572', 'AMMO4': '-0.010', 'AMMO2': '-0.002', 'AMMO5': '0.003', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'HITCOUNT': '0.130', 'AMMO3': '0.167', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.800', 'weapon2': '0.946', 'weapon3': '1.626', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:10,422][63733] Updated weights for policy 1, policy_version 410 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:12,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11400.5, 300 sec: 11036.9). Total num frames: 3035136. Throughput: 0: 1350.0, 1: 1484.4. Samples: 756884. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:12,460][109198] Avg episode reward: [(0, '-6.514'), (1, '-5.599')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:12,462][63576] Saving new best policy, reward=-5.599!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:12,538][63770] DAMAGECOUNT value on done: 302.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:12,671][63734] DAMAGECOUNT value on done: 640.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:12,671][63734] Sum rewards: -7.568, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.380', 'AMMO5': '0.010', 'AMMO2': '0.016', 'ARMOR': '0.032', 'WEAPON1': '0.040', 'AMMO4': '0.080', 'weapon4': '0.090', 'HITCOUNT': '0.100', 'AMMO3': '0.127', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.387', 'WEAPON3': '0.700', 'weapon3': '0.910', 'FRAGCOUNT': '1.000', 'weapon2': '1.170'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:12,883][63732] Updated weights for policy 0, policy_version 330 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:12,905][63770] DAMAGECOUNT value on done: 682.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:13,062][63734] DAMAGECOUNT value on done: 693.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:13,063][63734] Sum rewards: -2.003, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.250', 'AMMO5': '0.007', 'AMMO2': '0.011', 'WEAPON1': '0.020', 'weapon4': '0.022', 'weapon5': '0.034', 'AMMO4': '0.054', 'ARMOR': '0.076', 'AMMO3': '0.099', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.345', 'WEAPON3': '0.600', 'weapon2': '0.778', 'FRAGCOUNT': '1.000', 'weapon3': '1.150'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:13,629][63771] DAMAGECOUNT value on done: 947.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:13,629][63771] Sum rewards: -2.109, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.370', 'AMMO2': '0.005', 'AMMO5': '0.010', 'AMMO4': '0.025', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'AMMO3': '0.123', 'HITCOUNT': '0.250', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.765', 'weapon2': '1.104', 'weapon3': '1.128', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:13,943][63771] DAMAGECOUNT value on done: 664.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:13,944][63771] Sum rewards: -1.548, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.348', 'AMMO5': '0.005', 'weapon5': '0.024', 'ARMOR': '0.032', 'AMMO2': '0.033', 'AMMO3': '0.080', 'HITCOUNT': '0.090', 'WEAPON5': '0.100', 'AMMO4': '0.163', 'weapon4': '0.178', 'WEAPON4': '0.300', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.465', 'weapon3': '0.932', 'weapon2': '1.498', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:14,740][63805] DAMAGECOUNT value on done: 635.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:15,122][63805] DAMAGECOUNT value on done: 1083.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:15,123][63805] Sum rewards: -4.585, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.233', 'AMMO2': '0.003', 'AMMO4': '0.015', 'HITCOUNT': '0.030', 'ARMOR': '0.044', 'DAMAGECOUNT': '0.072', 'AMMO3': '0.106', 'WEAPON3': '0.500', 'weapon3': '0.672', 'FRAGCOUNT': '1.000', 'weapon2': '1.456'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:15,860][63735] DAMAGECOUNT value on done: 798.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:16,247][63735] DAMAGECOUNT value on done: 856.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:16,248][63735] Sum rewards: -5.727, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.122', 'AMMO2': '0.016', 'HITCOUNT': '0.060', 'AMMO4': '0.081', 'AMMO3': '0.115', 'WEAPON4': '0.200', 'weapon4': '0.292', 'DAMAGECOUNT': '0.360', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.228', 'weapon2': '1.242'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:17,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11400.6, 300 sec: 11044.6). Total num frames: 3092480. Throughput: 0: 1382.0, 1: 1460.5. Samples: 765698. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:17,460][109198] Avg episode reward: [(0, '-6.378'), (1, '-5.601')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:17,705][63767] DAMAGECOUNT value on done: 749.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:18,091][63767] DAMAGECOUNT value on done: 809.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:18,091][63767] Sum rewards: -7.499, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.792', 'AMMO2': '0.011', 'ARMOR': '0.056', 'AMMO4': '0.056', 'HITCOUNT': '0.080', 'WEAPON4': '0.100', 'weapon4': '0.142', 'AMMO3': '0.188', 'DAMAGECOUNT': '0.207', 'weapon3': '0.500', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.452'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:18,415][63733] Updated weights for policy 1, policy_version 420 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:19,197][63732] Updated weights for policy 0, policy_version 340 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:22,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11400.5, 300 sec: 11052.0). Total num frames: 3149824. Throughput: 0: 1465.7, 1: 1383.4. Samples: 783013. Policy #0 lag: (min: 0.0, avg: 0.5, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:22,460][109198] Avg episode reward: [(0, '-6.437'), (1, '-5.601')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:22,901][63805] DAMAGECOUNT value on done: 611.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:23,219][63805] DAMAGECOUNT value on done: 949.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:23,220][63805] Sum rewards: -4.407, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.350', 'AMMO2': '0.018', 'weapon4': '0.038', 'weapon7': '0.064', 'AMMO4': '0.090', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'HITCOUNT': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.159', 'DAMAGECOUNT': '0.648', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon3': '1.260', 'weapon2': '1.316'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:23,461][63767] DAMAGECOUNT value on done: 1371.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:23,462][63767] Sum rewards: -9.176, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-2.870', 'ARMOR': '0.004', 'AMMO5': '0.007', 'weapon5': '0.010', 'AMMO2': '0.027', 'HITCOUNT': '0.100', 'AMMO4': '0.136', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'AMMO3': '0.220', 'weapon4': '0.330', 'DAMAGECOUNT': '0.345', 'WEAPON3': '1.150', 'weapon2': '1.236', 'weapon3': '1.278', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:23,792][63767] DAMAGECOUNT value on done: 989.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:24,390][63770] DAMAGECOUNT value on done: 521.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:24,391][63770] Sum rewards: -3.436, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.742', 'AMMO5': '0.007', 'AMMO2': '0.009', 'ARMOR': '0.020', 'weapon4': '0.024', 'WEAPON1': '0.040', 'AMMO4': '0.044', 'HITCOUNT': '0.060', 'weapon5': '0.064', 'WEAPON4': '0.100', 'AMMO3': '0.106', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.360', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.108', 'weapon2': '1.114'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:24,745][63770] DAMAGECOUNT value on done: 591.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:24,746][63770] Sum rewards: -4.710, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.870', 'weapon4': '0.002', 'AMMO2': '0.003', 'AMMO5': '0.009', 'HITCOUNT': '0.010', 'AMMO4': '0.013', 'weapon5': '0.038', 'ARMOR': '0.080', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.135', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.750', 'weapon3': '0.906', 'FRAGCOUNT': '1.000', 'weapon2': '1.214'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:25,489][63771] DAMAGECOUNT value on done: 538.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:25,522][63732] Updated weights for policy 0, policy_version 350 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:25,862][63771] DAMAGECOUNT value on done: 1016.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:26,092][63769] DAMAGECOUNT value on done: 1033.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:26,093][63769] Sum rewards: -2.619, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.680', 'AMMO2': '0.003', 'AMMO4': '0.014', 'AMMO3': '0.152', 'HITCOUNT': '0.240', 'weapon2': '0.904', 'WEAPON3': '0.950', 'DAMAGECOUNT': '1.218', 'weapon3': '2.080', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:26,432][63769] DAMAGECOUNT value on done: 564.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:26,432][63769] Sum rewards: -7.240, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.240', 'AMMO5': '0.010', 'AMMO2': '0.030', 'HITCOUNT': '0.030', 'DAMAGECOUNT': '0.105', 'AMMO3': '0.118', 'AMMO4': '0.149', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'weapon4': '0.252', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.020', 'weapon2': '1.436'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:26,447][63733] Updated weights for policy 1, policy_version 430 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:27,458][109198] Fps is (10 sec: 11878.5, 60 sec: 11537.1, 300 sec: 11073.3). Total num frames: 3211264. Throughput: 0: 1548.5, 1: 1318.5. Samples: 800498. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:27,460][109198] Avg episode reward: [(0, '-6.365'), (1, '-5.639')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:28,733][63734] DAMAGECOUNT value on done: 1180.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:28,733][63734] Sum rewards: -2.780, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.233', 'AMMO2': '0.004', 'AMMO5': '0.012', 'AMMO4': '0.022', 'weapon5': '0.084', 'AMMO3': '0.103', 'HITCOUNT': '0.110', 'WEAPON5': '0.250', 'WEAPON3': '0.550', 'ARMOR': '0.562', 'DAMAGECOUNT': '0.660', 'weapon2': '1.028', 'weapon3': '1.068', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:29,129][63734] DAMAGECOUNT value on done: 841.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:29,963][63806] DAMAGECOUNT value on done: 1013.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:30,219][63806] DAMAGECOUNT value on done: 820.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:30,256][63806] DAMAGECOUNT value on done: 626.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:30,257][63806] Sum rewards: -2.513, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.318', 'AMMO5': '0.007', 'AMMO2': '0.011', 'weapon5': '0.034', 'ARMOR': '0.036', 'AMMO4': '0.056', 'AMMO3': '0.088', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.447', 'weapon3': '0.988', 'FRAGCOUNT': '1.000', 'weapon2': '1.138'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:30,593][63806] DAMAGECOUNT value on done: 873.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:30,593][63806] Sum rewards: -6.500, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.050', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.011', 'AMMO2': '0.024', 'HITCOUNT': '0.050', 'ARMOR': '0.052', 'weapon4': '0.072', 'AMMO4': '0.120', 'AMMO3': '0.139', 'weapon5': '0.192', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.800', 'weapon3': '1.000', 'weapon2': '1.024'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:31,817][63732] Updated weights for policy 0, policy_version 360 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:32,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11400.5, 300 sec: 11066.2). Total num frames: 3264512. Throughput: 0: 1579.5, 1: 1291.6. Samples: 809115. Policy #0 lag: (min: 0.0, avg: 0.3, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:32,460][109198] Avg episode reward: [(0, '-6.314'), (1, '-5.682')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:32,505][63454] Saving new best policy, reward=-6.314!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:32,872][63769] DAMAGECOUNT value on done: 906.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:33,218][63735] DAMAGECOUNT value on done: 740.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:33,307][63769] DAMAGECOUNT value on done: 483.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:33,536][63735] DAMAGECOUNT value on done: 917.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:34,588][63733] Updated weights for policy 1, policy_version 440 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:35,436][63770] DAMAGECOUNT value on done: 347.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:35,437][63770] Sum rewards: -7.550, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.003', 'HITCOUNT': '0.010', 'AMMO2': '0.021', 'weapon5': '0.046', 'WEAPON5': '0.050', 'AMMO3': '0.098', 'AMMO4': '0.103', 'ARMOR': '0.114', 'DAMAGECOUNT': '0.135', 'weapon4': '0.170', 'WEAPON4': '0.200', 'HEALTH': '0.252', 'WEAPON3': '0.500', 'weapon3': '0.650', 'weapon2': '1.348'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:35,824][63770] DAMAGECOUNT value on done: 812.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:36,129][63734] DAMAGECOUNT value on done: 640.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:36,129][63734] Sum rewards: -5.132, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.005', 'AMMO2': '0.012', 'weapon5': '0.014', 'ARMOR': '0.048', 'WEAPON5': '0.050', 'AMMO4': '0.060', 'AMMO3': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.140', 'WEAPON3': '0.500', 'HEALTH': '0.721', 'weapon2': '1.048', 'weapon3': '1.070'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:36,524][63734] DAMAGECOUNT value on done: 738.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:36,525][63734] Sum rewards: -5.306, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.310', 'AMMO5': '0.005', 'weapon5': '0.010', 'AMMO2': '0.016', 'HITCOUNT': '0.030', 'ARMOR': '0.032', 'AMMO3': '0.077', 'AMMO4': '0.081', 'weapon4': '0.096', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.135', 'WEAPON4': '0.200', 'WEAPON3': '0.450', 'weapon3': '0.908', 'FRAGCOUNT': '1.000', 'weapon2': '1.114'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:37,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11468.8, 300 sec: 11260.5). Total num frames: 3321856. Throughput: 0: 1616.6, 1: 1268.0. Samples: 826311. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:37,460][109198] Avg episode reward: [(0, '-6.120'), (1, '-5.694')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:37,499][63454] Saving new best policy, reward=-6.120!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:37,874][63805] DAMAGECOUNT value on done: 885.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:37,874][63805] Sum rewards: -4.246, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.900', 'AMMO5': '0.005', 'AMMO2': '0.007', 'weapon5': '0.018', 'weapon4': '0.026', 'AMMO4': '0.037', 'WEAPON4': '0.050', 'ARMOR': '0.060', 'WEAPON5': '0.100', 'HITCOUNT': '0.130', 'AMMO3': '0.133', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.750', 'weapon2': '1.038', 'weapon3': '1.100', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:38,131][63732] Updated weights for policy 0, policy_version 370 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:38,242][63735] DAMAGECOUNT value on done: 1038.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:38,243][63735] Sum rewards: -2.999, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.082', 'AMMO2': '0.011', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'AMMO4': '0.056', 'AMMO3': '0.115', 'HITCOUNT': '0.190', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.720', 'weapon3': '1.004', 'weapon2': '1.504', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:38,245][63805] DAMAGECOUNT value on done: 1228.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:38,245][63805] Sum rewards: -3.678, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.190', 'ARMOR': '0.004', 'AMMO5': '0.005', 'weapon4': '0.016', 'AMMO2': '0.019', 'weapon5': '0.020', 'WEAPON4': '0.050', 'AMMO4': '0.095', 'WEAPON5': '0.100', 'AMMO3': '0.102', 'HITCOUNT': '0.120', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.114', 'weapon2': '1.282'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:38,566][63771] DAMAGECOUNT value on done: 1069.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:38,566][63771] Sum rewards: -2.054, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.856', 'AMMO2': '0.010', 'AMMO4': '0.052', 'AMMO3': '0.090', 'HITCOUNT': '0.100', 'ARMOR': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.114', 'DAMAGECOUNT': '0.366', 'WEAPON3': '0.550', 'weapon3': '0.944', 'FRAGCOUNT': '1.000', 'weapon2': '1.376'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:38,582][63735] DAMAGECOUNT value on done: 966.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:38,583][63735] Sum rewards: -6.207, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.943', 'AMMO2': '0.014', 'weapon7': '0.020', 'HITCOUNT': '0.060', 'ARMOR': '0.064', 'AMMO4': '0.071', 'weapon4': '0.090', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.223', 'DAMAGECOUNT': '0.330', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050', 'weapon3': '1.184', 'weapon2': '1.480'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:39,006][63771] DAMAGECOUNT value on done: 704.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:39,007][63771] Sum rewards: -5.376, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.078', 'AMMO2': '0.001', 'weapon5': '0.002', 'AMMO5': '0.003', 'AMMO4': '0.003', 'HITCOUNT': '0.030', 'ARMOR': '0.032', 'WEAPON5': '0.050', 'DAMAGECOUNT': '0.120', 'AMMO3': '0.150', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.024', 'weapon3': '1.438'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:40,851][63767] DAMAGECOUNT value on done: 758.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:40,851][63767] Sum rewards: -8.112, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.263', 'AMMO5': '0.003', 'AMMO2': '0.006', 'ARMOR': '0.016', 'HITCOUNT': '0.020', 'DAMAGECOUNT': '0.027', 'WEAPON1': '0.030', 'AMMO4': '0.032', 'WEAPON5': '0.050', 'weapon4': '0.060', 'weapon5': '0.064', 'WEAPON4': '0.100', 'AMMO3': '0.144', 'WEAPON3': '0.800', 'weapon2': '1.090', 'weapon3': '1.208'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:41,194][63767] DAMAGECOUNT value on done: 883.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:41,195][63767] Sum rewards: -3.778, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.112', 'AMMO5': '0.007', 'ARMOR': '0.012', 'weapon5': '0.016', 'AMMO2': '0.022', 'HITCOUNT': '0.060', 'AMMO4': '0.109', 'AMMO3': '0.116', 'WEAPON5': '0.150', 'weapon4': '0.182', 'DAMAGECOUNT': '0.222', 'WEAPON4': '0.250', 'WEAPON3': '0.650', 'weapon3': '0.912', 'FRAGCOUNT': '1.000', 'weapon2': '1.126'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:42,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11537.1, 300 sec: 11302.2). Total num frames: 3379200. Throughput: 0: 1617.4, 1: 1266.0. Samples: 843472. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:42,460][109198] Avg episode reward: [(0, '-6.004'), (1, '-5.692')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:42,461][63454] Saving new best policy, reward=-6.004!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:42,726][63733] Updated weights for policy 1, policy_version 450 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:44,455][63732] Updated weights for policy 0, policy_version 380 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:45,326][63805] DAMAGECOUNT value on done: 675.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:45,326][63805] Sum rewards: -7.577, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.378', 'weapon5': '0.002', 'AMMO5': '0.003', 'AMMO2': '0.004', 'ARMOR': '0.020', 'AMMO4': '0.022', 'WEAPON5': '0.050', 'HITCOUNT': '0.090', 'WEAPON4': '0.150', 'AMMO3': '0.163', 'DAMAGECOUNT': '0.192', 'weapon4': '0.268', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.224', 'weapon3': '1.262'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:45,689][63805] DAMAGECOUNT value on done: 1034.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:45,690][63805] Sum rewards: -7.195, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.088', 'AMMO2': '0.002', 'AMMO5': '0.003', 'AMMO4': '0.010', 'WEAPON1': '0.030', 'WEAPON5': '0.050', 'HITCOUNT': '0.080', 'weapon5': '0.096', 'AMMO3': '0.133', 'DAMAGECOUNT': '0.255', 'WEAPON3': '0.650', 'weapon3': '1.088', 'weapon2': '1.246'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:46,015][63767] DAMAGECOUNT value on done: 1493.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:46,016][63767] Sum rewards: -8.856, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.233', 'AMMO2': '0.001', 'AMMO5': '0.003', 'AMMO4': '0.004', 'weapon4': '0.036', 'WEAPON4': '0.050', 'WEAPON5': '0.050', 'ARMOR': '0.056', 'HITCOUNT': '0.070', 'AMMO3': '0.185', 'DAMAGECOUNT': '0.366', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.186', 'weapon3': '1.470'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:46,366][63767] DAMAGECOUNT value on done: 1183.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:46,366][63767] Sum rewards: -3.631, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-0.500', 'HEALTH': '-0.226', 'AMMO5': '0.003', 'AMMO2': '0.007', 'weapon5': '0.014', 'AMMO4': '0.037', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'ARMOR': '0.064', 'AMMO3': '0.068', 'HITCOUNT': '0.120', 'weapon4': '0.146', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.582', 'weapon2': '0.968', 'weapon3': '1.336'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:47,315][63770] DAMAGECOUNT value on done: 531.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:47,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11468.8, 300 sec: 11302.2). Total num frames: 3436544. Throughput: 0: 1619.0, 1: 1264.1. Samples: 852248. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:47,460][109198] Avg episode reward: [(0, '-5.990'), (1, '-5.647')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:47,465][63454] Saving new best policy, reward=-5.990!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:47,704][63770] DAMAGECOUNT value on done: 646.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:48,521][63771] DAMAGECOUNT value on done: 638.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:48,872][63771] DAMAGECOUNT value on done: 1126.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:48,872][63771] Sum rewards: -6.142, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.248', 'AMMO5': '0.005', 'AMMO2': '0.015', 'weapon4': '0.044', 'AMMO4': '0.076', 'ARMOR': '0.093', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.142', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.278', 'weapon3': '1.472'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:49,066][63769] DAMAGECOUNT value on done: 1117.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:49,447][63769] DAMAGECOUNT value on done: 629.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:49,448][63769] Sum rewards: -5.832, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.844', 'AMMO2': '0.007', 'AMMO4': '0.037', 'HITCOUNT': '0.060', 'ARMOR': '0.064', 'AMMO3': '0.149', 'DAMAGECOUNT': '0.195', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon3': '1.296', 'weapon2': '1.304'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:50,783][63732] Updated weights for policy 0, policy_version 390 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:50,825][63733] Updated weights for policy 1, policy_version 460 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:52,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11537.1, 300 sec: 11302.2). Total num frames: 3493888. Throughput: 0: 1623.7, 1: 1266.7. Samples: 869616. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:52,460][109198] Avg episode reward: [(0, '-5.909'), (1, '-5.766')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:52,461][63454] Saving new best policy, reward=-5.909!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:52,500][63806] DAMAGECOUNT value on done: 1038.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:52,874][63806] DAMAGECOUNT value on done: 940.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:52,923][63806] DAMAGECOUNT value on done: 646.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:53,203][63806] DAMAGECOUNT value on done: 1038.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:53,204][63806] Sum rewards: -1.778, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.958', 'AMMO5': '0.005', 'AMMO2': '0.008', 'AMMO4': '0.038', 'ARMOR': '0.040', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.116', 'WEAPON4': '0.150', 'weapon4': '0.234', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.012', 'weapon2': '1.232'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:53,761][63734] DAMAGECOUNT value on done: 1220.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:54,218][63734] DAMAGECOUNT value on done: 976.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:54,219][63734] Sum rewards: -4.631, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.744', 'AMMO4': '-0.031', 'AMMO2': '-0.006', 'weapon5': '0.014', 'AMMO5': '0.022', 'HITCOUNT': '0.080', 'AMMO3': '0.098', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.450', 'weapon3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.380'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:57,236][63732] Updated weights for policy 0, policy_version 400 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:57,458][109198] Fps is (10 sec: 11878.3, 60 sec: 11537.1, 300 sec: 11316.1). Total num frames: 3555328. Throughput: 0: 1618.3, 1: 1263.5. Samples: 886566. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:41:57,460][109198] Avg episode reward: [(0, '-5.973'), (1, '-5.723')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:58,021][63735] DAMAGECOUNT value on done: 765.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:58,063][63769] DAMAGECOUNT value on done: 956.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:58,413][63735] DAMAGECOUNT value on done: 962.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:58,485][63769] DAMAGECOUNT value on done: 593.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:58,639][63770] DAMAGECOUNT value on done: 512.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:58,639][63770] Sum rewards: -5.445, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.345', 'AMMO5': '0.003', 'AMMO2': '0.006', 'AMMO4': '0.028', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'weapon4': '0.116', 'AMMO3': '0.129', 'ARMOR': '0.486', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.700', 'weapon3': '0.972', 'FRAGCOUNT': '1.000', 'weapon2': '1.506'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:58,970][63770] DAMAGECOUNT value on done: 907.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:58,971][63770] Sum rewards: -2.420, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.245', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.014', 'ARMOR': '0.032', 'weapon5': '0.064', 'AMMO4': '0.069', 'HITCOUNT': '0.090', 'AMMO3': '0.131', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'weapon4': '0.282', 'DAMAGECOUNT': '0.285', 'WEAPON3': '0.750', 'weapon3': '0.838', 'weapon2': '1.204', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:41:59,118][63733] Updated weights for policy 1, policy_version 470 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:00,001][63734] DAMAGECOUNT value on done: 685.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:00,343][63734] DAMAGECOUNT value on done: 753.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:00,836][63735] DAMAGECOUNT value on done: 1228.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:00,836][63735] Sum rewards: -5.979, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.159', 'AMMO5': '0.007', 'AMMO2': '0.009', 'ARMOR': '0.020', 'weapon5': '0.022', 'AMMO4': '0.044', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'AMMO3': '0.166', 'weapon4': '0.170', 'HITCOUNT': '0.200', 'DAMAGECOUNT': '0.570', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.112', 'weapon3': '1.310'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:00,979][63805] DAMAGECOUNT value on done: 920.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:00,980][63805] Sum rewards: -3.990, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.390', 'AMMO5': '0.003', 'AMMO2': '0.018', 'weapon5': '0.020', 'HITCOUNT': '0.040', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'AMMO3': '0.085', 'AMMO4': '0.088', 'DAMAGECOUNT': '0.105', 'WEAPON4': '0.250', 'weapon4': '0.366', 'WEAPON3': '0.450', 'weapon3': '0.866', 'FRAGCOUNT': '1.000', 'weapon2': '1.270'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:01,216][63735] DAMAGECOUNT value on done: 1211.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:01,217][63735] Sum rewards: -4.265, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.570', 'AMMO5': '0.005', 'AMMO2': '0.024', 'weapon5': '0.024', 'WEAPON5': '0.100', 'AMMO4': '0.118', 'AMMO3': '0.145', 'HITCOUNT': '0.160', 'WEAPON4': '0.200', 'weapon4': '0.320', 'ARMOR': '0.460', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.735', 'weapon3': '0.792', 'weapon2': '1.122', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:01,369][63805] DAMAGECOUNT value on done: 1238.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:02,458][109198] Fps is (10 sec: 11878.3, 60 sec: 11537.1, 300 sec: 11329.9). Total num frames: 3612672. Throughput: 0: 1611.4, 1: 1260.9. Samples: 894953. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:02,460][109198] Avg episode reward: [(0, '-5.935'), (1, '-5.706')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:03,652][63732] Updated weights for policy 0, policy_version 410 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:03,760][63771] DAMAGECOUNT value on done: 1140.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:03,938][63767] DAMAGECOUNT value on done: 818.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:04,145][63771] DAMAGECOUNT value on done: 965.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:04,146][63771] Sum rewards: -1.629, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.434', 'weapon5': '0.002', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO4': '0.022', 'weapon4': '0.042', 'WEAPON5': '0.050', 'WEAPON4': '0.100', 'ARMOR': '0.114', 'AMMO3': '0.120', 'HITCOUNT': '0.190', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.783', 'weapon2': '1.188', 'weapon3': '1.536', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:04,326][63767] DAMAGECOUNT value on done: 1026.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:07,190][63733] Updated weights for policy 1, policy_version 480 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:07,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11468.8, 300 sec: 11302.2). Total num frames: 3665920. Throughput: 0: 1613.4, 1: 1261.5. Samples: 912386. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:07,460][109198] Avg episode reward: [(0, '-5.936'), (1, '-5.630')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:07,959][63805] DAMAGECOUNT value on done: 756.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:08,331][63805] DAMAGECOUNT value on done: 1144.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:08,332][63805] Sum rewards: -1.709, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.290', 'weapon5': '0.006', 'ARMOR': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.017', 'WEAPON1': '0.020', 'HITCOUNT': '0.060', 'AMMO4': '0.085', 'AMMO3': '0.089', 'WEAPON4': '0.100', 'weapon4': '0.152', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.500', 'weapon2': '0.822', 'FRAGCOUNT': '1.000', 'weapon3': '1.432'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:08,528][63767] DAMAGECOUNT value on done: 1648.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:08,921][63767] DAMAGECOUNT value on done: 1353.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:10,113][63732] Updated weights for policy 0, policy_version 420 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:10,762][63770] DAMAGECOUNT value on done: 701.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:10,763][63770] Sum rewards: -2.160, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.112', 'AMMO2': '0.025', 'AMMO3': '0.105', 'AMMO4': '0.127', 'HITCOUNT': '0.150', 'WEAPON4': '0.300', 'weapon4': '0.386', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.600', 'ARMOR': '0.879', 'weapon3': '0.982', 'weapon2': '1.138', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:11,094][63770] DAMAGECOUNT value on done: 678.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:11,632][63771] DAMAGECOUNT value on done: 753.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:11,974][63771] DAMAGECOUNT value on done: 1161.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:12,125][63769] DAMAGECOUNT value on done: 1227.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:12,459][109198] Fps is (10 sec: 11059.0, 60 sec: 11468.7, 300 sec: 11316.1). Total num frames: 3723264. Throughput: 0: 1605.4, 1: 1258.5. Samples: 929375. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:12,461][109198] Avg episode reward: [(0, '-5.968'), (1, '-5.644')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:12,464][63769] DAMAGECOUNT value on done: 689.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:15,268][63733] Updated weights for policy 1, policy_version 490 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:15,411][63806] DAMAGECOUNT value on done: 1151.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:15,412][63806] Sum rewards: -6.906, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.108', 'AMMO5': '0.010', 'AMMO2': '0.011', 'AMMO4': '0.053', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.201', 'DAMAGECOUNT': '0.309', 'weapon2': '0.960', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050', 'weapon3': '1.658'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:15,773][63806] DAMAGECOUNT value on done: 1140.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:15,774][63806] Sum rewards: -4.436, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.382', 'AMMO5': '0.003', 'WEAPON1': '0.020', 'AMMO2': '0.025', 'WEAPON5': '0.050', 'weapon5': '0.052', 'ARMOR': '0.072', 'AMMO4': '0.123', 'HITCOUNT': '0.150', 'AMMO3': '0.166', 'WEAPON4': '0.200', 'weapon4': '0.214', 'DAMAGECOUNT': '0.600', 'weapon3': '0.882', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.240'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:15,818][63806] DAMAGECOUNT value on done: 646.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:16,106][63806] DAMAGECOUNT value on done: 1089.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:16,107][63806] Sum rewards: -8.801, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.957', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'WEAPON5': '0.050', 'HITCOUNT': '0.050', 'AMMO4': '0.055', 'weapon5': '0.076', 'AMMO3': '0.110', 'DAMAGECOUNT': '0.153', 'WEAPON3': '0.550', 'weapon3': '0.838', 'FRAGCOUNT': '1.000', 'weapon2': '1.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:16,319][63732] Updated weights for policy 0, policy_version 430 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:17,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11468.8, 300 sec: 11316.1). Total num frames: 3780608. Throughput: 0: 1610.8, 1: 1259.4. Samples: 938271. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:17,460][109198] Avg episode reward: [(0, '-6.049'), (1, '-5.696')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:19,071][63734] DAMAGECOUNT value on done: 1393.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:19,071][63734] Sum rewards: -6.370, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.378', 'AMMO2': '0.007', 'AMMO5': '0.007', 'ARMOR': '0.016', 'WEAPON1': '0.020', 'AMMO4': '0.034', 'weapon5': '0.090', 'HITCOUNT': '0.140', 'AMMO3': '0.147', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.519', 'WEAPON3': '0.750', 'weapon2': '0.936', 'weapon3': '1.192'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:19,509][63734] DAMAGECOUNT value on done: 1234.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:19,509][63734] Sum rewards: -4.263, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.735', 'AMMO2': '0.024', 'ARMOR': '0.072', 'AMMO3': '0.109', 'AMMO4': '0.121', 'WEAPON4': '0.150', 'HITCOUNT': '0.190', 'weapon4': '0.540', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.774', 'weapon3': '0.902', 'weapon2': '1.290', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:20,084][63805] Large shaping reward -2.603 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', 0.05, 10.0), ('AMMO2', 0.0012000000000000001, 6.0), ('WEAPON3', -0.05, -1.0), ('AMMO3', -0.008, -16.0), ('AMMO4', 0.006, 6.0), ('WEAPON5', -0.05, -1.0), ('AMMO5', -0.0025, -5.0), ('AMMO6', -0.1, -100.0), ('WEAPON7', -0.1, -1.0), ('AMMO7', -0.1, -100.0)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:21,684][63770] DAMAGECOUNT value on done: 562.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:22,081][63770] DAMAGECOUNT value on done: 1242.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:22,082][63770] Sum rewards: -1.495, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.149', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'WEAPON4': '0.050', 'AMMO4': '0.057', 'weapon4': '0.080', 'AMMO3': '0.099', 'weapon5': '0.124', 'WEAPON5': '0.200', 'HITCOUNT': '0.220', 'WEAPON3': '0.550', 'DAMAGECOUNT': '1.005', 'weapon2': '1.100', 'weapon3': '1.138', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:22,117][63735] DAMAGECOUNT value on done: 1005.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:22,118][63735] Sum rewards: -8.036, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.758', 'AMMO5': '0.010', 'ARMOR': '0.010', 'weapon5': '0.020', 'AMMO2': '0.038', 'weapon4': '0.090', 'AMMO3': '0.152', 'AMMO4': '0.188', 'WEAPON5': '0.200', 'HITCOUNT': '0.230', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.720', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon3': '1.204', 'weapon2': '1.510'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:22,458][109198] Fps is (10 sec: 11469.1, 60 sec: 11468.8, 300 sec: 11330.0). Total num frames: 3837952. Throughput: 0: 1613.3, 1: 1264.0. Samples: 955791. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:22,460][109198] Avg episode reward: [(0, '-6.027'), (1, '-5.682')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:22,480][63735] DAMAGECOUNT value on done: 1092.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:22,481][63735] Sum rewards: -3.107, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.436', 'AMMO5': '0.005', 'AMMO2': '0.010', 'weapon5': '0.012', 'ARMOR': '0.028', 'AMMO4': '0.052', 'AMMO3': '0.094', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon4': '0.210', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.114', 'weapon3': '1.164'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:22,649][63732] Updated weights for policy 0, policy_version 440 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:22,930][63735] DAMAGECOUNT value on done: 1324.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:22,930][63735] Sum rewards: -7.234, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.333', 'AMMO2': '0.010', 'weapon5': '0.012', 'AMMO5': '0.014', 'AMMO4': '0.049', 'ARMOR': '0.064', 'HITCOUNT': '0.070', 'AMMO3': '0.113', 'WEAPON4': '0.200', 'weapon4': '0.266', 'DAMAGECOUNT': '0.288', 'WEAPON5': '0.300', 'WEAPON3': '0.700', 'weapon2': '0.958', 'weapon3': '1.554'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:23,035][63769] DAMAGECOUNT value on done: 1121.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:23,035][63769] Sum rewards: 0.126, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.534', 'AMMO5': '0.005', 'AMMO2': '0.006', 'weapon5': '0.008', 'ARMOR': '0.028', 'AMMO4': '0.032', 'weapon7': '0.062', 'AMMO3': '0.097', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'HITCOUNT': '0.120', 'weapon4': '0.220', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.495', 'weapon2': '1.098', 'weapon3': '1.338', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:23,217][63733] Updated weights for policy 1, policy_version 500 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:23,285][63735] DAMAGECOUNT value on done: 1523.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:23,285][63735] Sum rewards: -1.863, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.876', 'WEAPON1': '0.020', 'AMMO2': '0.020', 'ARMOR': '0.080', 'AMMO4': '0.100', 'AMMO3': '0.132', 'weapon4': '0.134', 'WEAPON4': '0.200', 'HITCOUNT': '0.240', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.936', 'weapon3': '1.214', 'weapon2': '1.336', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:23,459][63769] DAMAGECOUNT value on done: 920.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:23,460][63769] Sum rewards: -1.385, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.638', 'AMMO5': '0.007', 'AMMO2': '0.018', 'ARMOR': '0.032', 'weapon5': '0.048', 'weapon7': '0.090', 'AMMO4': '0.091', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'AMMO3': '0.197', 'HITCOUNT': '0.200', 'weapon4': '0.314', 'weapon3': '0.882', 'DAMAGECOUNT': '0.981', 'WEAPON3': '1.000', 'weapon2': '1.342', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:23,679][63734] DAMAGECOUNT value on done: 910.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:23,680][63734] Sum rewards: -1.943, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.692', 'AMMO2': '0.009', 'AMMO5': '0.017', 'weapon5': '0.040', 'AMMO4': '0.042', 'ARMOR': '0.064', 'AMMO3': '0.110', 'weapon4': '0.122', 'WEAPON5': '0.150', 'HITCOUNT': '0.180', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.700', 'weapon2': '1.248', 'weapon3': '1.442', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:24,077][63734] DAMAGECOUNT value on done: 848.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:24,078][63734] Sum rewards: -1.828, reward structure: {'DEATHCOUNT': '-5.250', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'AMMO2': '0.016', 'ARMOR': '0.025', 'weapon4': '0.038', 'HEALTH': '0.048', 'AMMO4': '0.078', 'HITCOUNT': '0.090', 'AMMO3': '0.091', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.124', 'DAMAGECOUNT': '0.285', 'WEAPON3': '0.450', 'weapon2': '1.208', 'weapon3': '1.264'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:24,133][63805] DAMAGECOUNT value on done: 1080.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:24,134][63805] Sum rewards: -11.835, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.780', 'FRAGCOUNT': '-2.000', 'AMMO2': '0.005', 'AMMO5': '0.006', 'WEAPON1': '0.020', 'AMMO4': '0.026', 'ARMOR': '0.036', 'weapon4': '0.048', 'weapon5': '0.052', 'WEAPON4': '0.100', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'HITCOUNT': '0.120', 'WEAPON5': '0.150', 'AMMO3': '0.229', 'DAMAGECOUNT': '0.480', 'WEAPON3': '1.300', 'weapon3': '1.378', 'weapon2': '1.444'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:24,461][63805] DAMAGECOUNT value on done: 1385.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:24,461][63805] Sum rewards: -5.140, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.630', 'WEAPON1': '0.010', 'AMMO5': '0.016', 'AMMO2': '0.026', 'ARMOR': '0.028', 'weapon5': '0.092', 'HITCOUNT': '0.110', 'AMMO3': '0.121', 'AMMO4': '0.132', 'WEAPON4': '0.250', 'WEAPON5': '0.250', 'weapon4': '0.394', 'DAMAGECOUNT': '0.441', 'WEAPON3': '0.650', 'weapon3': '0.938', 'weapon2': '1.282', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:26,748][63767] DAMAGECOUNT value on done: 937.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:26,748][63767] Sum rewards: -0.674, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.244', 'AMMO5': '0.007', 'AMMO2': '0.027', 'weapon5': '0.032', 'HITCOUNT': '0.120', 'AMMO3': '0.127', 'AMMO4': '0.134', 'WEAPON5': '0.150', 'WEAPON4': '0.350', 'DAMAGECOUNT': '0.357', 'weapon4': '0.386', 'ARMOR': '0.448', 'WEAPON3': '0.700', 'weapon3': '0.748', 'weapon2': '1.484', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:27,133][63767] DAMAGECOUNT value on done: 1264.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:27,133][63767] Sum rewards: -6.243, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.916', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO4': '0.049', 'WEAPON5': '0.050', 'weapon5': '0.092', 'AMMO3': '0.119', 'HITCOUNT': '0.170', 'WEAPON4': '0.250', 'weapon4': '0.390', 'ARMOR': '0.456', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.714', 'weapon3': '0.966', 'weapon2': '1.202'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:27,458][109198] Fps is (10 sec: 11878.3, 60 sec: 11468.8, 300 sec: 11343.8). Total num frames: 3899392. Throughput: 0: 1614.8, 1: 1265.3. Samples: 973075. Policy #0 lag: (min: 0.0, avg: 0.4, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:27,460][109198] Avg episode reward: [(0, '-5.980'), (1, '-5.477')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:27,466][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000505_2068480.pth...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:27,466][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000447_1830912.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:27,526][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000151_618496.pth\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:27,533][63576] Saving new best policy, reward=-5.477!\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:27,539][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000134_548864.pth\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:28,611][63771] DAMAGECOUNT value on done: 1205.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:28,939][63732] Updated weights for policy 0, policy_version 450 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:29,074][63771] DAMAGECOUNT value on done: 1316.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:29,075][63771] Sum rewards: -2.872, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.170', 'AMMO2': '0.014', 'ARMOR': '0.044', 'AMMO4': '0.072', 'WEAPON4': '0.150', 'AMMO3': '0.197', 'weapon4': '0.200', 'HITCOUNT': '0.260', 'WEAPON3': '0.700', 'weapon3': '1.050', 'DAMAGECOUNT': '1.053', 'weapon2': '1.308', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:30,469][63805] DAMAGECOUNT value on done: 781.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:30,731][63767] DAMAGECOUNT value on done: 1897.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:30,732][63767] Sum rewards: -5.202, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.774', 'AMMO4': '-0.039', 'AMMO2': '-0.008', 'AMMO5': '0.003', 'AMMO3': '0.157', 'HITCOUNT': '0.180', 'DAMAGECOUNT': '0.747', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.348', 'weapon2': '1.384'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:30,794][63805] DAMAGECOUNT value on done: 1204.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:30,794][63805] Sum rewards: -2.883, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.780', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'AMMO5': '0.003', 'weapon5': '0.036', 'WEAPON1': '0.040', 'WEAPON5': '0.050', 'AMMO3': '0.068', 'HITCOUNT': '0.070', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon7': '0.100', 'DAMAGECOUNT': '0.180', 'WEAPON3': '0.400', 'weapon2': '0.952', 'FRAGCOUNT': '1.000', 'weapon3': '1.462'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:31,061][63767] DAMAGECOUNT value on done: 1473.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:31,201][63733] Updated weights for policy 1, policy_version 510 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:32,458][109198] Fps is (10 sec: 11878.2, 60 sec: 11537.0, 300 sec: 11357.7). Total num frames: 3956736. Throughput: 0: 1612.2, 1: 1266.0. Samples: 981769. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:32,461][109198] Avg episode reward: [(0, '-5.988'), (1, '-5.324')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:32,462][63576] Saving new best policy, reward=-5.324!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:33,661][63770] DAMAGECOUNT value on done: 756.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:33,662][63770] Sum rewards: -9.677, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.970', 'AMMO5': '0.005', 'AMMO2': '0.005', 'ARMOR': '0.020', 'AMMO4': '0.026', 'HITCOUNT': '0.050', 'weapon4': '0.074', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.155', 'DAMAGECOUNT': '0.165', 'WEAPON3': '0.800', 'weapon3': '0.948', 'FRAGCOUNT': '1.000', 'weapon2': '1.594'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:34,038][63770] DAMAGECOUNT value on done: 941.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:34,039][63770] Sum rewards: -1.617, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO2': '0.002', 'AMMO5': '0.007', 'AMMO4': '0.009', 'weapon5': '0.082', 'AMMO3': '0.130', 'WEAPON5': '0.150', 'HEALTH': '0.176', 'HITCOUNT': '0.180', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.789', 'FRAGCOUNT': '1.000', 'weapon2': '1.160', 'weapon3': '1.548'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:34,301][63771] DAMAGECOUNT value on done: 970.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:34,301][63771] Sum rewards: -5.358, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.598', 'AMMO4': '-0.013', 'AMMO2': '-0.003', 'AMMO5': '0.005', 'weapon5': '0.016', 'WEAPON4': '0.050', 'WEAPON5': '0.050', 'ARMOR': '0.052', 'weapon4': '0.090', 'AMMO3': '0.095', 'HITCOUNT': '0.220', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.651', 'FRAGCOUNT': '1.000', 'weapon2': '1.228', 'weapon3': '1.348'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:34,688][63771] DAMAGECOUNT value on done: 1246.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:34,901][63769] DAMAGECOUNT value on done: 1342.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:34,901][63769] Sum rewards: -6.298, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.920', 'AMMO2': '0.002', 'AMMO5': '0.005', 'AMMO4': '0.008', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'HITCOUNT': '0.120', 'weapon4': '0.122', 'AMMO3': '0.158', 'DAMAGECOUNT': '0.345', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.010', 'weapon3': '1.670'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:35,278][63769] DAMAGECOUNT value on done: 748.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:35,278][63769] Sum rewards: -1.147, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.980', 'AMMO5': '0.005', 'AMMO2': '0.008', 'WEAPON1': '0.020', 'AMMO4': '0.041', 'weapon5': '0.048', 'HITCOUNT': '0.050', 'AMMO3': '0.063', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.104', 'DAMAGECOUNT': '0.177', 'WEAPON3': '0.400', 'ARMOR': '0.472', 'FRAGCOUNT': '1.000', 'weapon3': '1.230', 'weapon2': '1.264'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:35,298][63732] Updated weights for policy 0, policy_version 460 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:37,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11537.1, 300 sec: 11357.7). Total num frames: 4014080. Throughput: 0: 1610.6, 1: 1266.9. Samples: 999104. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:37,460][109198] Avg episode reward: [(0, '-6.017'), (1, '-5.424')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:37,857][63806] DAMAGECOUNT value on done: 1299.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:37,857][63806] Sum rewards: -7.312, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.190', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.012', 'AMMO5': '0.013', 'AMMO4': '0.062', 'ARMOR': '0.064', 'weapon5': '0.076', 'HITCOUNT': '0.120', 'weapon4': '0.170', 'AMMO3': '0.176', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.444', 'WEAPON3': '0.800', 'weapon3': '1.052', 'weapon2': '1.388'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:38,138][63806] DAMAGECOUNT value on done: 1440.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:38,138][63806] Sum rewards: -3.615, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.870', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'AMMO2': '0.015', 'weapon7': '0.060', 'AMMO4': '0.074', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.100', 'AMMO3': '0.139', 'HITCOUNT': '0.160', 'weapon4': '0.172', 'WEAPON4': '0.200', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.900', 'weapon2': '1.130', 'weapon3': '1.250'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:38,184][63806] DAMAGECOUNT value on done: 813.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:38,184][63806] Sum rewards: -3.809, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.172', 'AMMO5': '0.003', 'AMMO2': '0.009', 'ARMOR': '0.024', 'AMMO4': '0.044', 'WEAPON5': '0.050', 'AMMO3': '0.114', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.501', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.384', 'weapon2': '1.424'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:38,543][63806] DAMAGECOUNT value on done: 1173.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:38,544][63806] Sum rewards: -11.490, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-2.946', 'AMMO5': '0.013', 'AMMO2': '0.015', 'ARMOR': '0.060', 'AMMO4': '0.072', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'weapon4': '0.116', 'AMMO3': '0.232', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.252', 'FRAGCOUNT': '1.000', 'weapon3': '1.082', 'WEAPON3': '1.150', 'weapon2': '1.274'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:39,354][63733] Updated weights for policy 1, policy_version 520 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:41,599][63732] Updated weights for policy 0, policy_version 470 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:42,458][109198] Fps is (10 sec: 11469.0, 60 sec: 11537.1, 300 sec: 11371.6). Total num frames: 4071424. Throughput: 0: 1614.6, 1: 1271.2. Samples: 1016428. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:42,459][109198] Avg episode reward: [(0, '-5.964'), (1, '-5.424')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:44,383][63734] DAMAGECOUNT value on done: 1453.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:44,383][63734] Sum rewards: -8.302, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.562', 'AMMO5': '0.004', 'weapon4': '0.012', 'AMMO2': '0.012', 'weapon5': '0.034', 'WEAPON4': '0.050', 'AMMO4': '0.061', 'HITCOUNT': '0.070', 'WEAPON5': '0.100', 'AMMO3': '0.158', 'DAMAGECOUNT': '0.180', 'ARMOR': '0.452', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.900', 'weapon2': '1.354', 'weapon3': '1.372'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:44,777][63770] DAMAGECOUNT value on done: 577.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:44,794][63734] DAMAGECOUNT value on done: 1562.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:44,795][63734] Sum rewards: -1.245, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.793', 'AMMO5': '0.005', 'weapon5': '0.010', 'AMMO2': '0.019', 'ARMOR': '0.036', 'AMMO4': '0.095', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.163', 'HITCOUNT': '0.220', 'weapon2': '0.696', 'DAMAGECOUNT': '0.984', 'WEAPON3': '1.000', 'weapon3': '1.870', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:45,014][63735] DAMAGECOUNT value on done: 1561.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:45,014][63735] Sum rewards: -2.968, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.582', 'AMMO2': '0.008', 'AMMO4': '0.041', 'WEAPON4': '0.050', 'ARMOR': '0.116', 'AMMO3': '0.156', 'HITCOUNT': '0.170', 'weapon4': '0.290', 'DAMAGECOUNT': '0.711', 'WEAPON3': '0.800', 'weapon2': '0.990', 'weapon3': '1.282', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:45,101][63770] DAMAGECOUNT value on done: 1367.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:45,102][63770] Sum rewards: -6.046, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.859', 'AMMO2': '0.002', 'AMMO4': '0.009', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'weapon4': '0.086', 'HITCOUNT': '0.110', 'AMMO3': '0.151', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.012', 'weapon3': '1.636'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:45,355][63735] DAMAGECOUNT value on done: 1623.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:46,384][63735] DAMAGECOUNT value on done: 1055.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:46,385][63735] Sum rewards: -5.626, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.330', 'AMMO5': '0.008', 'AMMO2': '0.009', 'WEAPON1': '0.020', 'HITCOUNT': '0.040', 'AMMO4': '0.043', 'weapon5': '0.044', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'weapon4': '0.100', 'AMMO3': '0.110', 'DAMAGECOUNT': '0.150', 'ARMOR': '0.509', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.044', 'weapon2': '1.578'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:46,769][63735] DAMAGECOUNT value on done: 1122.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:46,769][63735] Sum rewards: -4.885, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.160', 'AMMO2': '0.026', 'HITCOUNT': '0.030', 'DAMAGECOUNT': '0.090', 'AMMO4': '0.128', 'AMMO3': '0.162', 'ARMOR': '0.441', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.066', 'weapon3': '1.782'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:47,359][63805] DAMAGECOUNT value on done: 1280.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:47,360][63805] Sum rewards: -11.179, reward structure: {'DEATHCOUNT': '-14.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.835', 'AMMO5': '0.008', 'WEAPON1': '0.010', 'ARMOR': '0.016', 'AMMO2': '0.032', 'weapon5': '0.070', 'weapon4': '0.074', 'WEAPON5': '0.150', 'AMMO4': '0.162', 'AMMO3': '0.175', 'HITCOUNT': '0.190', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.600', 'WEAPON3': '0.950', 'weapon3': '1.174', 'weapon2': '1.494'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:47,431][63733] Updated weights for policy 1, policy_version 530 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:47,458][109198] Fps is (10 sec: 11878.6, 60 sec: 11605.3, 300 sec: 11385.5). Total num frames: 4132864. Throughput: 0: 1619.4, 1: 1271.3. Samples: 1025034. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:47,459][109198] Avg episode reward: [(0, '-5.942'), (1, '-5.400')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:47,540][63734] DAMAGECOUNT value on done: 940.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:47,712][63805] DAMAGECOUNT value on done: 1645.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:47,713][63805] Sum rewards: -7.892, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.710', 'AMMO5': '0.013', 'AMMO2': '0.024', 'WEAPON1': '0.030', 'weapon5': '0.046', 'AMMO3': '0.111', 'AMMO4': '0.120', 'HITCOUNT': '0.120', 'WEAPON5': '0.200', 'weapon4': '0.218', 'WEAPON4': '0.250', 'ARMOR': '0.445', 'WEAPON3': '0.600', 'weapon3': '0.648', 'DAMAGECOUNT': '0.780', 'FRAGCOUNT': '1.500', 'weapon2': '1.712'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:47,900][63734] DAMAGECOUNT value on done: 878.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:47,900][63734] Sum rewards: -8.083, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-3.000', 'HEALTH': '-2.230', 'AMMO2': '0.020', 'WEAPON1': '0.020', 'HITCOUNT': '0.020', 'AMMO5': '0.021', 'DAMAGECOUNT': '0.090', 'AMMO4': '0.099', 'AMMO3': '0.119', 'weapon4': '0.120', 'weapon5': '0.138', 'WEAPON4': '0.300', 'WEAPON5': '0.350', 'ARMOR': '0.492', 'WEAPON3': '0.700', 'weapon3': '0.866', 'weapon2': '1.292'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:47,914][63769] DAMAGECOUNT value on done: 1161.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:48,002][63732] Updated weights for policy 0, policy_version 480 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:48,400][63769] DAMAGECOUNT value on done: 1030.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:48,400][63769] Sum rewards: -5.927, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.814', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.007', 'AMMO2': '0.021', 'weapon5': '0.046', 'HITCOUNT': '0.100', 'AMMO4': '0.102', 'ARMOR': '0.116', 'WEAPON5': '0.150', 'AMMO3': '0.151', 'WEAPON4': '0.200', 'weapon4': '0.220', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.850', 'weapon2': '1.042', 'weapon3': '1.302'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:49,532][63767] DAMAGECOUNT value on done: 1012.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:49,910][63767] DAMAGECOUNT value on done: 1309.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:49,910][63767] Sum rewards: -5.008, reward structure: {'DEATHCOUNT': '-6.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.115', 'AMMO5': '0.007', 'AMMO2': '0.018', 'ARMOR': '0.040', 'HITCOUNT': '0.040', 'weapon5': '0.040', 'weapon4': '0.072', 'AMMO4': '0.088', 'AMMO3': '0.099', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.135', 'WEAPON5': '0.150', 'WEAPON3': '0.500', 'weapon2': '0.932', 'weapon3': '1.386'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:52,458][109198] Fps is (10 sec: 11878.4, 60 sec: 11605.3, 300 sec: 11399.4). Total num frames: 4190208. Throughput: 0: 1616.2, 1: 1272.1. Samples: 1042360. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:52,460][109198] Avg episode reward: [(0, '-5.922'), (1, '-5.427')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:53,021][63767] DAMAGECOUNT value on done: 1980.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:53,115][63805] DAMAGECOUNT value on done: 881.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:53,115][63805] Sum rewards: -8.924, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.412', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.003', 'weapon4': '0.004', 'AMMO2': '0.016', 'ARMOR': '0.036', 'weapon6': '0.046', 'weapon5': '0.046', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.077', 'HITCOUNT': '0.090', 'AMMO3': '0.140', 'AMMO6': '0.198', 'AMMO7': '0.198', 'WEAPON6': '0.200', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.800', 'weapon3': '0.902', 'weapon2': '1.582'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:53,389][63767] DAMAGECOUNT value on done: 1618.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:53,389][63767] Sum rewards: -4.987, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.807', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'weapon5': '0.006', 'AMMO2': '0.013', 'ARMOR': '0.032', 'AMMO4': '0.062', 'WEAPON5': '0.100', 'AMMO3': '0.137', 'HITCOUNT': '0.140', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.750', 'weapon2': '1.050', 'weapon3': '1.840'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:53,437][63805] DAMAGECOUNT value on done: 1269.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:53,437][63805] Sum rewards: -10.534, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-2.222', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.019', 'ARMOR': '0.024', 'weapon4': '0.046', 'HITCOUNT': '0.070', 'AMMO4': '0.095', 'WEAPON5': '0.100', 'AMMO3': '0.134', 'DAMAGECOUNT': '0.195', 'WEAPON4': '0.200', 'WEAPON3': '0.650', 'weapon3': '0.808', 'FRAGCOUNT': '1.000', 'weapon2': '1.832'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:53,733][63771] DAMAGECOUNT value on done: 1246.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:53,733][63771] Sum rewards: -10.158, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.575', 'FRAGCOUNT': '-1.500', 'AMMO2': '0.004', 'AMMO5': '0.010', 'weapon5': '0.018', 'AMMO4': '0.019', 'WEAPON1': '0.020', 'ARMOR': '0.040', 'HITCOUNT': '0.040', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.123', 'weapon4': '0.188', 'WEAPON5': '0.200', 'AMMO3': '0.220', 'weapon3': '1.066', 'WEAPON3': '1.100', 'weapon2': '1.270'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:54,108][63771] DAMAGECOUNT value on done: 1598.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:54,109][63771] Sum rewards: -2.524, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.130', 'AMMO5': '0.005', 'AMMO2': '0.006', 'weapon5': '0.022', 'AMMO4': '0.031', 'ARMOR': '0.036', 'AMMO3': '0.098', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'HITCOUNT': '0.210', 'weapon4': '0.262', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.846', 'weapon3': '1.152', 'weapon2': '1.288', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:54,260][63732] Updated weights for policy 0, policy_version 490 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:55,560][63733] Updated weights for policy 1, policy_version 540 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:56,794][63770] DAMAGECOUNT value on done: 1111.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:56,795][63770] Sum rewards: 2.252, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.460', 'AMMO5': '0.005', 'AMMO2': '0.024', 'weapon5': '0.044', 'ARMOR': '0.050', 'AMMO3': '0.092', 'WEAPON5': '0.100', 'AMMO4': '0.121', 'weapon4': '0.126', 'WEAPON4': '0.150', 'HITCOUNT': '0.310', 'WEAPON3': '0.550', 'weapon2': '1.032', 'DAMAGECOUNT': '1.065', 'weapon3': '1.542', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:57,125][63770] DAMAGECOUNT value on done: 976.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:57,235][63771] DAMAGECOUNT value on done: 990.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:57,236][63771] Sum rewards: -8.750, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.207', 'AMMO2': '0.002', 'AMMO5': '0.007', 'ARMOR': '0.008', 'AMMO4': '0.010', 'HITCOUNT': '0.020', 'weapon5': '0.052', 'DAMAGECOUNT': '0.060', 'WEAPON5': '0.100', 'AMMO3': '0.167', 'WEAPON3': '0.900', 'weapon2': '1.014', 'weapon3': '1.366'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:57,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11537.1, 300 sec: 11399.4). Total num frames: 4247552. Throughput: 0: 1624.1, 1: 1273.8. Samples: 1059781. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:42:57,460][109198] Avg episode reward: [(0, '-5.809'), (1, '-5.572')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:57,467][63454] Saving new best policy, reward=-5.809!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:57,595][63771] DAMAGECOUNT value on done: 1276.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:57,626][63769] DAMAGECOUNT value on done: 1511.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:57,627][63769] Sum rewards: -1.433, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.222', 'AMMO5': '0.007', 'AMMO2': '0.010', 'WEAPON1': '0.020', 'weapon5': '0.030', 'AMMO4': '0.051', 'WEAPON5': '0.100', 'AMMO3': '0.111', 'HITCOUNT': '0.120', 'WEAPON4': '0.150', 'weapon4': '0.164', 'DAMAGECOUNT': '0.507', 'WEAPON3': '0.700', 'weapon2': '0.918', 'weapon3': '1.400', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:42:58,008][63769] DAMAGECOUNT value on done: 808.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:00,159][63806] DAMAGECOUNT value on done: 1518.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:00,159][63806] Sum rewards: -0.143, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.292', 'AMMO5': '0.010', 'weapon5': '0.012', 'AMMO2': '0.015', 'weapon4': '0.022', 'HITCOUNT': '0.060', 'AMMO4': '0.076', 'ARMOR': '0.084', 'weapon7': '0.084', 'AMMO3': '0.091', 'WEAPON5': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.657', 'weapon2': '1.250', 'weapon3': '1.448', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:00,462][63806] DAMAGECOUNT value on done: 1610.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:00,463][63806] Sum rewards: -2.034, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.648', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'weapon5': '0.026', 'AMMO2': '0.026', 'HITCOUNT': '0.050', 'ARMOR': '0.072', 'weapon7': '0.078', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.128', 'AMMO4': '0.130', 'WEAPON4': '0.250', 'WEAPON5': '0.300', 'weapon4': '0.354', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.700', 'weapon3': '0.972', 'FRAGCOUNT': '1.000', 'weapon2': '1.182'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:00,507][63806] DAMAGECOUNT value on done: 922.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:00,508][63806] Sum rewards: -9.072, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.950', 'AMMO2': '0.010', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.047', 'ARMOR': '0.076', 'weapon5': '0.082', 'WEAPON4': '0.100', 'weapon4': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.165', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.327', 'WEAPON3': '0.900', 'weapon2': '1.216', 'weapon3': '1.224', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:00,614][63732] Updated weights for policy 0, policy_version 500 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:00,845][63806] DAMAGECOUNT value on done: 1368.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:00,846][63806] Sum rewards: -4.365, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.480', 'AMMO5': '0.010', 'weapon5': '0.026', 'AMMO2': '0.034', 'weapon7': '0.058', 'AMMO3': '0.089', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'AMMO4': '0.169', 'WEAPON3': '0.400', 'WEAPON4': '0.450', 'weapon4': '0.486', 'DAMAGECOUNT': '0.585', 'weapon3': '0.616', 'weapon2': '1.432', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:02,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11468.8, 300 sec: 11385.5). Total num frames: 4300800. Throughput: 0: 1618.4, 1: 1270.5. Samples: 1068271. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:02,460][109198] Avg episode reward: [(0, '-5.679'), (1, '-5.557')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:02,461][63454] Saving new best policy, reward=-5.679!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:03,694][63733] Updated weights for policy 1, policy_version 550 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:07,007][63732] Updated weights for policy 0, policy_version 510 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:07,364][63735] DAMAGECOUNT value on done: 1942.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:07,365][63735] Sum rewards: -1.330, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.405', 'AMMO2': '0.010', 'AMMO5': '0.011', 'weapon5': '0.034', 'AMMO4': '0.048', 'WEAPON4': '0.050', 'ARMOR': '0.064', 'AMMO3': '0.091', 'weapon4': '0.116', 'HITCOUNT': '0.180', 'WEAPON5': '0.250', 'WEAPON3': '0.550', 'weapon2': '1.140', 'DAMAGECOUNT': '1.143', 'weapon3': '1.388', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:07,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11537.1, 300 sec: 11385.5). Total num frames: 4358144. Throughput: 0: 1613.4, 1: 1265.9. Samples: 1085360. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:07,460][109198] Avg episode reward: [(0, '-5.679'), (1, '-5.538')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:07,731][63735] DAMAGECOUNT value on done: 1750.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:07,731][63735] Sum rewards: -6.211, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.038', 'AMMO5': '0.005', 'AMMO2': '0.032', 'HITCOUNT': '0.080', 'WEAPON5': '0.100', 'AMMO3': '0.150', 'AMMO4': '0.159', 'WEAPON4': '0.250', 'weapon4': '0.250', 'DAMAGECOUNT': '0.381', 'ARMOR': '0.488', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.236', 'weapon3': '1.246'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:07,956][63770] DAMAGECOUNT value on done: 622.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:08,348][63770] DAMAGECOUNT value on done: 1517.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:08,349][63770] Sum rewards: -3.183, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.524', 'AMMO2': '0.017', 'AMMO4': '0.083', 'AMMO3': '0.105', 'ARMOR': '0.108', 'HITCOUNT': '0.150', 'weapon4': '0.200', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.600', 'weapon3': '1.226', 'weapon2': '1.352', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:09,604][63734] DAMAGECOUNT value on done: 1487.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:09,949][63734] DAMAGECOUNT value on done: 1614.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:10,565][63805] DAMAGECOUNT value on done: 1325.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:10,881][63735] DAMAGECOUNT value on done: 1085.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:10,882][63735] Sum rewards: -6.424, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.720', 'AMMO5': '0.005', 'weapon5': '0.010', 'AMMO2': '0.024', 'HITCOUNT': '0.030', 'ARMOR': '0.040', 'AMMO3': '0.083', 'DAMAGECOUNT': '0.090', 'WEAPON5': '0.100', 'AMMO4': '0.120', 'WEAPON4': '0.250', 'weapon4': '0.394', 'WEAPON3': '0.450', 'weapon3': '0.846', 'FRAGCOUNT': '1.000', 'weapon2': '1.604'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:10,934][63805] DAMAGECOUNT value on done: 1890.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:10,935][63805] Sum rewards: -4.485, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.904', 'AMMO5': '0.012', 'weapon5': '0.016', 'AMMO2': '0.026', 'weapon7': '0.064', 'ARMOR': '0.068', 'AMMO4': '0.128', 'weapon4': '0.130', 'AMMO3': '0.132', 'HITCOUNT': '0.150', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.735', 'WEAPON3': '0.800', 'weapon2': '1.256', 'weapon3': '1.432', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:11,063][63734] DAMAGECOUNT value on done: 1024.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:11,064][63734] Sum rewards: -2.125, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO5': '0.008', 'AMMO2': '0.021', 'ARMOR': '0.036', 'AMMO3': '0.075', 'weapon5': '0.096', 'HITCOUNT': '0.100', 'AMMO4': '0.107', 'HEALTH': '0.138', 'WEAPON5': '0.150', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.252', 'WEAPON3': '0.400', 'weapon4': '0.468', 'FRAGCOUNT': '0.500', 'weapon3': '0.764', 'weapon2': '1.260'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:11,281][63735] DAMAGECOUNT value on done: 1176.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:11,472][63734] DAMAGECOUNT value on done: 968.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:11,473][63734] Sum rewards: -7.987, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.800', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.003', 'AMMO2': '0.009', 'WEAPON1': '0.010', 'AMMO4': '0.046', 'WEAPON5': '0.050', 'ARMOR': '0.052', 'weapon5': '0.062', 'HITCOUNT': '0.080', 'AMMO3': '0.115', 'WEAPON4': '0.150', 'weapon4': '0.210', 'DAMAGECOUNT': '0.270', 'WEAPON3': '0.650', 'weapon3': '0.652', 'weapon2': '1.704'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:11,773][63733] Updated weights for policy 1, policy_version 560 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:12,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11537.1, 300 sec: 11399.4). Total num frames: 4415488. Throughput: 0: 1615.4, 1: 1264.8. Samples: 1102685. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:12,459][109198] Avg episode reward: [(0, '-5.530'), (1, '-5.504')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:12,461][63454] Saving new best policy, reward=-5.530!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:12,608][63767] DAMAGECOUNT value on done: 1143.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:12,609][63767] Sum rewards: -3.563, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.780', 'AMMO2': '0.011', 'AMMO5': '0.018', 'WEAPON1': '0.040', 'AMMO4': '0.057', 'weapon4': '0.062', 'ARMOR': '0.080', 'HITCOUNT': '0.100', 'weapon5': '0.100', 'AMMO3': '0.110', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.393', 'WEAPON5': '0.400', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.198', 'weapon3': '1.248'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:13,004][63767] DAMAGECOUNT value on done: 1314.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:13,005][63767] Sum rewards: -6.913, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.643', 'AMMO5': '0.003', 'weapon5': '0.008', 'AMMO2': '0.009', 'HITCOUNT': '0.010', 'DAMAGECOUNT': '0.015', 'ARMOR': '0.040', 'AMMO4': '0.045', 'WEAPON5': '0.050', 'WEAPON4': '0.100', 'AMMO3': '0.106', 'weapon4': '0.180', 'WEAPON3': '0.450', 'weapon3': '0.884', 'weapon2': '1.580'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:13,192][63769] DAMAGECOUNT value on done: 1236.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:13,356][63732] Updated weights for policy 0, policy_version 520 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:13,624][63769] DAMAGECOUNT value on done: 1150.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:13,624][63769] Sum rewards: -0.859, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.430', 'AMMO5': '0.003', 'HITCOUNT': '0.010', 'AMMO2': '0.020', 'WEAPON1': '0.020', 'ARMOR': '0.050', 'weapon5': '0.066', 'AMMO3': '0.079', 'AMMO4': '0.097', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.180', 'DAMAGECOUNT': '0.360', 'WEAPON3': '0.400', 'weapon3': '0.994', 'FRAGCOUNT': '1.000', 'weapon2': '1.342'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:15,604][63805] DAMAGECOUNT value on done: 1066.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:15,605][63805] Sum rewards: -6.721, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.684', 'weapon5': '0.002', 'AMMO5': '0.005', 'ARMOR': '0.025', 'AMMO2': '0.026', 'WEAPON5': '0.100', 'AMMO4': '0.127', 'HITCOUNT': '0.150', 'AMMO3': '0.177', 'weapon4': '0.184', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.555', 'WEAPON3': '0.750', 'weapon2': '1.276', 'weapon3': '1.336', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:15,756][63767] DAMAGECOUNT value on done: 2015.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:15,997][63805] DAMAGECOUNT value on done: 1499.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:15,997][63805] Sum rewards: -6.193, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.295', 'AMMO4': '-0.006', 'AMMO2': '-0.001', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'ARMOR': '0.020', 'weapon5': '0.040', 'WEAPON4': '0.050', 'weapon4': '0.080', 'AMMO3': '0.092', 'HITCOUNT': '0.120', 'WEAPON5': '0.250', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.690', 'weapon3': '0.908', 'weapon2': '1.336', 'FRAGCOUNT': '1.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:16,125][63767] DAMAGECOUNT value on done: 1648.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:16,126][63767] Sum rewards: -5.379, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.290', 'AMMO5': '0.003', 'AMMO2': '0.005', 'weapon5': '0.006', 'AMMO4': '0.027', 'HITCOUNT': '0.030', 'WEAPON5': '0.050', 'DAMAGECOUNT': '0.090', 'AMMO3': '0.160', 'WEAPON3': '0.800', 'weapon2': '0.870', 'FRAGCOUNT': '1.000', 'weapon3': '1.620'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:17,458][109198] Fps is (10 sec: 11878.5, 60 sec: 11605.3, 300 sec: 11399.4). Total num frames: 4476928. Throughput: 0: 1615.6, 1: 1263.5. Samples: 1111328. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:17,460][109198] Avg episode reward: [(0, '-5.486'), (1, '-5.541')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:17,465][63454] Saving new best policy, reward=-5.486!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:18,850][63771] DAMAGECOUNT value on done: 1276.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:19,280][63771] DAMAGECOUNT value on done: 1886.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:19,281][63771] Sum rewards: -7.162, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.760', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO4': '0.027', 'ARMOR': '0.032', 'weapon5': '0.044', 'WEAPON5': '0.100', 'HITCOUNT': '0.120', 'weapon4': '0.164', 'WEAPON4': '0.200', 'AMMO3': '0.203', 'DAMAGECOUNT': '0.864', 'WEAPON3': '1.050', 'weapon3': '1.340', 'weapon2': '1.444', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:19,644][63732] Updated weights for policy 0, policy_version 530 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:19,767][63770] DAMAGECOUNT value on done: 1288.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:19,957][63733] Updated weights for policy 1, policy_version 570 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:20,080][63770] DAMAGECOUNT value on done: 1141.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:20,344][63771] DAMAGECOUNT value on done: 1050.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:20,344][63771] Sum rewards: -10.177, reward structure: {'DEATHCOUNT': '-11.250', 'FRAGCOUNT': '-2.000', 'HEALTH': '-0.968', 'AMMO5': '0.007', 'AMMO2': '0.010', 'HITCOUNT': '0.050', 'AMMO4': '0.051', 'weapon5': '0.070', 'WEAPON5': '0.150', 'AMMO3': '0.157', 'DAMAGECOUNT': '0.180', 'weapon2': '0.888', 'WEAPON3': '0.900', 'weapon3': '1.578'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:20,614][63769] DAMAGECOUNT value on done: 1671.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:20,614][63769] Sum rewards: -6.698, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.390', 'AMMO2': '0.013', 'weapon4': '0.024', 'AMMO4': '0.065', 'AMMO3': '0.110', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.480', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.116', 'weapon2': '1.534'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:20,715][63771] DAMAGECOUNT value on done: 1326.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:20,715][63771] Sum rewards: -4.602, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.840', 'AMMO4': '-0.024', 'AMMO2': '-0.005', 'HITCOUNT': '0.060', 'DAMAGECOUNT': '0.150', 'AMMO3': '0.183', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.182', 'weapon3': '1.442'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:20,991][63769] DAMAGECOUNT value on done: 951.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:20,992][63769] Sum rewards: -6.496, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.094', 'AMMO2': '0.012', 'ARMOR': '0.052', 'AMMO4': '0.059', 'HITCOUNT': '0.090', 'AMMO3': '0.124', 'WEAPON4': '0.150', 'weapon4': '0.284', 'DAMAGECOUNT': '0.429', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.084', 'weapon3': '1.164'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:22,458][109198] Fps is (10 sec: 11878.4, 60 sec: 11605.3, 300 sec: 11413.3). Total num frames: 4534272. Throughput: 0: 1615.4, 1: 1262.7. Samples: 1128621. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:22,460][109198] Avg episode reward: [(0, '-5.497'), (1, '-5.552')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:22,691][63806] DAMAGECOUNT value on done: 1533.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:23,008][63806] DAMAGECOUNT value on done: 1883.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:23,009][63806] Sum rewards: 1.081, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.777', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'AMMO5': '0.013', 'weapon4': '0.038', 'AMMO4': '0.053', 'weapon5': '0.054', 'AMMO3': '0.082', 'WEAPON4': '0.100', 'HITCOUNT': '0.150', 'WEAPON5': '0.250', 'WEAPON3': '0.450', 'ARMOR': '0.493', 'DAMAGECOUNT': '0.819', 'weapon2': '1.146', 'weapon3': '1.440', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:23,058][63806] DAMAGECOUNT value on done: 1042.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:23,058][63806] Sum rewards: -2.259, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO5': '0.005', 'AMMO2': '0.008', 'WEAPON1': '0.010', 'ARMOR': '0.012', 'HEALTH': '0.018', 'AMMO4': '0.040', 'weapon5': '0.050', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.129', 'HITCOUNT': '0.130', 'weapon4': '0.194', 'DAMAGECOUNT': '0.360', 'WEAPON3': '0.600', 'weapon2': '0.908', 'FRAGCOUNT': '1.000', 'weapon3': '1.576'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:23,406][63806] DAMAGECOUNT value on done: 1418.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:25,955][63732] Updated weights for policy 0, policy_version 540 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:27,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11537.1, 300 sec: 11427.1). Total num frames: 4591616. Throughput: 0: 1617.3, 1: 1261.7. Samples: 1145982. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:27,460][109198] Avg episode reward: [(0, '-5.485'), (1, '-5.552')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:27,941][63733] Updated weights for policy 1, policy_version 580 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:29,680][63735] DAMAGECOUNT value on done: 2047.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:29,680][63735] Sum rewards: -5.926, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.514', 'AMMO5': '0.005', 'AMMO2': '0.038', 'ARMOR': '0.048', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.174', 'AMMO4': '0.192', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.315', 'weapon4': '0.426', 'WEAPON3': '0.850', 'weapon2': '0.918', 'weapon3': '1.412', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:30,005][63735] DAMAGECOUNT value on done: 1990.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:30,006][63735] Sum rewards: -5.739, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.486', 'AMMO2': '0.002', 'AMMO5': '0.005', 'AMMO4': '0.011', 'weapon4': '0.022', 'ARMOR': '0.032', 'WEAPON4': '0.100', 'HITCOUNT': '0.170', 'AMMO3': '0.217', 'DAMAGECOUNT': '0.720', 'WEAPON3': '1.000', 'weapon2': '1.292', 'weapon3': '1.426', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:30,799][63770] DAMAGECOUNT value on done: 1104.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:30,799][63770] Sum rewards: 1.594, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.596', 'WEAPON1': '0.010', 'AMMO5': '0.016', 'AMMO2': '0.017', 'ARMOR': '0.056', 'AMMO3': '0.083', 'AMMO4': '0.083', 'WEAPON4': '0.100', 'weapon4': '0.180', 'weapon5': '0.224', 'HITCOUNT': '0.260', 'WEAPON5': '0.350', 'WEAPON3': '0.450', 'weapon3': '0.864', 'DAMAGECOUNT': '1.446', 'weapon2': '1.550', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:31,171][63770] DAMAGECOUNT value on done: 1686.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:31,172][63770] Sum rewards: -5.726, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.814', 'WEAPON1': '0.010', 'ARMOR': '0.024', 'AMMO2': '0.026', 'weapon4': '0.064', 'AMMO3': '0.111', 'AMMO4': '0.130', 'HITCOUNT': '0.150', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.507', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.178', 'weapon2': '1.538'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:32,222][63732] Updated weights for policy 0, policy_version 550 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:32,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11537.1, 300 sec: 11427.2). Total num frames: 4648960. Throughput: 0: 1618.1, 1: 1261.9. Samples: 1154634. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:32,460][109198] Avg episode reward: [(0, '-5.407'), (1, '-5.597')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:32,461][63454] Saving new best policy, reward=-5.407!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:33,731][63805] DAMAGECOUNT value on done: 1349.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:33,732][63805] Sum rewards: -9.418, reward structure: {'DEATHCOUNT': '-11.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.074', 'AMMO2': '0.005', 'ARMOR': '0.016', 'AMMO5': '0.019', 'WEAPON1': '0.020', 'AMMO4': '0.026', 'HITCOUNT': '0.040', 'WEAPON4': '0.050', 'weapon4': '0.060', 'DAMAGECOUNT': '0.072', 'weapon5': '0.082', 'AMMO3': '0.167', 'WEAPON5': '0.350', 'WEAPON3': '0.800', 'weapon3': '1.156', 'weapon2': '1.542'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:34,079][63805] DAMAGECOUNT value on done: 2070.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:34,751][63734] DAMAGECOUNT value on done: 1139.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:34,751][63734] Sum rewards: -6.380, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.398', 'AMMO4': '-0.027', 'AMMO2': '-0.005', 'WEAPON1': '0.010', 'AMMO5': '0.024', 'HITCOUNT': '0.080', 'weapon5': '0.100', 'AMMO3': '0.133', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.345', 'WEAPON3': '0.700', 'ARMOR': '0.908', 'weapon2': '1.278', 'weapon3': '1.672'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:34,842][63734] DAMAGECOUNT value on done: 1754.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:34,843][63734] Sum rewards: -4.059, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.480', 'AMMO5': '0.003', 'AMMO2': '0.035', 'WEAPON5': '0.050', 'ARMOR': '0.060', 'AMMO3': '0.117', 'AMMO4': '0.177', 'HITCOUNT': '0.200', 'weapon4': '0.438', 'WEAPON4': '0.450', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.801', 'weapon3': '0.996', 'weapon2': '1.444', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:35,124][63735] DAMAGECOUNT value on done: 1164.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:35,125][63735] Sum rewards: -3.542, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.672', 'AMMO5': '0.015', 'AMMO2': '0.025', 'HITCOUNT': '0.060', 'ARMOR': '0.064', 'WEAPON5': '0.100', 'AMMO3': '0.111', 'AMMO4': '0.124', 'DAMAGECOUNT': '0.237', 'WEAPON4': '0.400', 'weapon4': '0.438', 'WEAPON3': '0.600', 'weapon3': '0.704', 'FRAGCOUNT': '1.000', 'weapon2': '1.752'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:35,156][63734] DAMAGECOUNT value on done: 1355.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:35,157][63734] Sum rewards: -0.758, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.277', 'AMMO5': '0.003', 'ARMOR': '0.004', 'AMMO2': '0.008', 'AMMO4': '0.039', 'weapon4': '0.042', 'WEAPON5': '0.050', 'weapon7': '0.054', 'AMMO3': '0.096', 'WEAPON4': '0.150', 'AMMO6': '0.160', 'AMMO7': '0.160', 'HITCOUNT': '0.190', 'WEAPON7': '0.200', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.125', 'weapon3': '1.298', 'weapon2': '1.340'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:35,264][63734] DAMAGECOUNT value on done: 1767.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:35,264][63734] Sum rewards: -4.062, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.060', 'AMMO4': '-0.029', 'AMMO2': '-0.006', 'AMMO5': '0.005', 'ARMOR': '0.040', 'WEAPON5': '0.100', 'HITCOUNT': '0.140', 'AMMO3': '0.165', 'DAMAGECOUNT': '0.459', 'WEAPON3': '0.800', 'weapon2': '1.074', 'weapon3': '1.500', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:35,573][63767] DAMAGECOUNT value on done: 1335.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:35,574][63767] Sum rewards: -4.298, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.036', 'AMMO5': '0.009', 'AMMO2': '0.020', 'WEAPON1': '0.040', 'weapon5': '0.088', 'WEAPON5': '0.100', 'AMMO4': '0.100', 'AMMO3': '0.123', 'HITCOUNT': '0.150', 'weapon4': '0.202', 'WEAPON4': '0.300', 'ARMOR': '0.404', 'DAMAGECOUNT': '0.576', 'WEAPON3': '0.700', 'weapon3': '0.788', 'weapon2': '1.888', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:35,574][63735] DAMAGECOUNT value on done: 1335.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:35,575][63735] Sum rewards: -3.408, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.069', 'AMMO2': '0.007', 'ARMOR': '0.028', 'AMMO4': '0.037', 'weapon4': '0.096', 'WEAPON4': '0.100', 'AMMO3': '0.126', 'HITCOUNT': '0.140', 'DAMAGECOUNT': '0.477', 'WEAPON3': '0.650', 'weapon2': '0.964', 'FRAGCOUNT': '1.000', 'weapon3': '1.536'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:35,908][63767] DAMAGECOUNT value on done: 1498.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:35,909][63767] Sum rewards: -4.694, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.683', 'AMMO2': '0.004', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.020', 'ARMOR': '0.028', 'weapon5': '0.058', 'HITCOUNT': '0.140', 'AMMO3': '0.173', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.552', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.292', 'weapon3': '1.486'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:36,072][63733] Updated weights for policy 1, policy_version 590 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:37,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11537.1, 300 sec: 11427.1). Total num frames: 4706304. Throughput: 0: 1618.7, 1: 1262.7. Samples: 1172023. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:37,460][109198] Avg episode reward: [(0, '-5.311'), (1, '-5.581')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:37,466][63454] Saving new best policy, reward=-5.311!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:38,145][63767] DAMAGECOUNT value on done: 2144.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:38,145][63767] Sum rewards: -2.630, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.080', 'AMMO5': '0.003', 'AMMO2': '0.003', 'weapon5': '0.006', 'ARMOR': '0.008', 'AMMO4': '0.015', 'WEAPON5': '0.050', 'HITCOUNT': '0.110', 'AMMO3': '0.138', 'DAMAGECOUNT': '0.387', 'WEAPON3': '0.800', 'weapon2': '0.886', 'weapon3': '1.544', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:38,332][63769] DAMAGECOUNT value on done: 1326.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:38,333][63769] Sum rewards: -3.458, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.552', 'AMMO2': '0.020', 'HITCOUNT': '0.080', 'ARMOR': '0.088', 'WEAPON4': '0.100', 'AMMO4': '0.101', 'AMMO3': '0.119', 'DAMAGECOUNT': '0.270', 'weapon4': '0.352', 'WEAPON3': '0.700', 'weapon3': '0.838', 'FRAGCOUNT': '1.000', 'weapon2': '1.176'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:38,396][63805] DAMAGECOUNT value on done: 1131.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:38,537][63767] DAMAGECOUNT value on done: 1707.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:38,632][63732] Updated weights for policy 0, policy_version 560 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:38,768][63805] DAMAGECOUNT value on done: 1519.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:38,784][63769] DAMAGECOUNT value on done: 1258.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:42,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11537.1, 300 sec: 11441.0). Total num frames: 4763648. Throughput: 0: 1615.9, 1: 1261.7. Samples: 1189276. Policy #0 lag: (min: 0.0, avg: 0.4, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:42,460][109198] Avg episode reward: [(0, '-5.292'), (1, '-5.499')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:42,461][63454] Saving new best policy, reward=-5.292!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:42,667][63770] DAMAGECOUNT value on done: 1408.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:43,038][63770] DAMAGECOUNT value on done: 1221.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:43,045][63771] DAMAGECOUNT value on done: 1070.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:43,425][63771] DAMAGECOUNT value on done: 1340.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:43,701][63771] DAMAGECOUNT value on done: 1415.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:43,753][63769] DAMAGECOUNT value on done: 1771.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:44,034][63771] DAMAGECOUNT value on done: 2066.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:44,035][63771] Sum rewards: -3.717, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.804', 'AMMO2': '0.015', 'ARMOR': '0.052', 'AMMO4': '0.074', 'weapon4': '0.098', 'WEAPON4': '0.100', 'HITCOUNT': '0.140', 'AMMO3': '0.196', 'DAMAGECOUNT': '0.540', 'weapon2': '1.060', 'WEAPON3': '1.100', 'weapon3': '1.462', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:44,107][63733] Updated weights for policy 1, policy_version 600 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:44,136][63769] DAMAGECOUNT value on done: 1141.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:44,136][63769] Sum rewards: -5.166, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.885', 'AMMO4': '-0.020', 'AMMO2': '-0.004', 'weapon5': '0.004', 'AMMO5': '0.010', 'ARMOR': '0.032', 'WEAPON5': '0.100', 'HITCOUNT': '0.140', 'AMMO3': '0.165', 'DAMAGECOUNT': '0.570', 'WEAPON3': '0.850', 'weapon2': '1.288', 'weapon3': '1.334', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:44,925][63732] Updated weights for policy 0, policy_version 570 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:45,106][63806] DAMAGECOUNT value on done: 1738.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:45,106][63806] Sum rewards: -0.396, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.771', 'WEAPON1': '0.010', 'AMMO5': '0.018', 'AMMO2': '0.028', 'weapon7': '0.032', 'ARMOR': '0.072', 'weapon4': '0.084', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'weapon5': '0.102', 'AMMO3': '0.122', 'AMMO4': '0.140', 'HITCOUNT': '0.180', 'WEAPON5': '0.250', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.615', 'WEAPON3': '0.700', 'weapon3': '1.290', 'weapon2': '1.382', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:45,401][63806] DAMAGECOUNT value on done: 1971.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:45,402][63806] Sum rewards: -10.115, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-3.288', 'AMMO2': '0.020', 'AMMO5': '0.020', 'HITCOUNT': '0.030', 'WEAPON1': '0.040', 'weapon4': '0.084', 'AMMO4': '0.099', 'weapon5': '0.114', 'AMMO3': '0.202', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.264', 'WEAPON5': '0.300', 'ARMOR': '0.436', 'FRAGCOUNT': '1.000', 'weapon3': '1.066', 'WEAPON3': '1.150', 'weapon2': '1.598'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:45,479][63806] DAMAGECOUNT value on done: 1135.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:45,480][63806] Sum rewards: -10.285, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.628', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.012', 'AMMO2': '0.013', 'AMMO4': '0.066', 'HITCOUNT': '0.100', 'weapon5': '0.138', 'AMMO3': '0.143', 'DAMAGECOUNT': '0.279', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon4': '0.358', 'ARMOR': '0.447', 'WEAPON3': '0.800', 'weapon3': '1.090', 'weapon2': '1.546'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:45,783][63806] DAMAGECOUNT value on done: 1558.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:47,458][109198] Fps is (10 sec: 11878.4, 60 sec: 11537.1, 300 sec: 11454.9). Total num frames: 4825088. Throughput: 0: 1619.4, 1: 1263.5. Samples: 1198002. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:47,460][109198] Avg episode reward: [(0, '-5.368'), (1, '-5.576')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:51,180][63732] Updated weights for policy 0, policy_version 580 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:51,839][63735] DAMAGECOUNT value on done: 2092.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:51,839][63735] Sum rewards: -9.337, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.140', 'AMMO2': '0.023', 'ARMOR': '0.068', 'HITCOUNT': '0.070', 'AMMO4': '0.113', 'DAMAGECOUNT': '0.135', 'AMMO3': '0.180', 'weapon4': '0.202', 'WEAPON4': '0.250', 'WEAPON3': '0.750', 'weapon3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.112'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:52,192][63733] Updated weights for policy 1, policy_version 610 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:52,250][63735] DAMAGECOUNT value on done: 2070.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:52,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11468.8, 300 sec: 11427.1). Total num frames: 4878336. Throughput: 0: 1624.0, 1: 1264.6. Samples: 1215347. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:52,460][109198] Avg episode reward: [(0, '-5.368'), (1, '-5.597')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:53,682][63770] DAMAGECOUNT value on done: 1180.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:53,682][63770] Sum rewards: 0.278, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.040', 'AMMO5': '0.007', 'AMMO2': '0.012', 'WEAPON1': '0.030', 'weapon5': '0.042', 'AMMO4': '0.062', 'HITCOUNT': '0.080', 'AMMO3': '0.090', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.228', 'ARMOR': '0.500', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon2': '1.320', 'weapon3': '1.546'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:54,025][63770] DAMAGECOUNT value on done: 1738.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:56,844][63805] DAMAGECOUNT value on done: 1469.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:56,845][63805] Sum rewards: -7.595, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.982', 'ARMOR': '0.004', 'AMMO5': '0.007', 'AMMO2': '0.011', 'AMMO4': '0.053', 'HITCOUNT': '0.070', 'weapon5': '0.072', 'AMMO3': '0.134', 'WEAPON5': '0.150', 'WEAPON4': '0.300', 'weapon4': '0.340', 'DAMAGECOUNT': '0.360', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.238', 'weapon2': '1.348'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:57,202][63805] DAMAGECOUNT value on done: 2153.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:57,202][63805] Sum rewards: -11.089, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-1.635', 'FRAGCOUNT': '-1.500', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'AMMO2': '0.041', 'weapon5': '0.062', 'HITCOUNT': '0.090', 'AMMO3': '0.091', 'AMMO4': '0.207', 'weapon4': '0.214', 'DAMAGECOUNT': '0.249', 'WEAPON5': '0.250', 'WEAPON4': '0.400', 'weapon3': '0.406', 'WEAPON3': '0.500', 'ARMOR': '0.534', 'weapon2': '2.476'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:57,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11468.8, 300 sec: 11441.0). Total num frames: 4935680. Throughput: 0: 1624.3, 1: 1267.8. Samples: 1232829. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:43:57,460][109198] Avg episode reward: [(0, '-5.405'), (1, '-5.597')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:57,491][63732] Updated weights for policy 0, policy_version 590 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:58,231][63734] DAMAGECOUNT value on done: 1369.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:58,232][63734] Sum rewards: -3.738, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.238', 'AMMO5': '0.005', 'AMMO2': '0.009', 'AMMO4': '0.045', 'WEAPON5': '0.050', 'AMMO3': '0.068', 'weapon7': '0.086', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.150', 'HITCOUNT': '0.150', 'WEAPON7': '0.200', 'weapon4': '0.294', 'ARMOR': '0.440', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.690', 'FRAGCOUNT': '1.000', 'weapon3': '1.030', 'weapon2': '1.592'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:58,486][63767] DAMAGECOUNT value on done: 1565.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:58,487][63767] Sum rewards: -3.091, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.724', 'AMMO5': '0.016', 'AMMO2': '0.024', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'AMMO4': '0.118', 'weapon5': '0.124', 'AMMO3': '0.127', 'WEAPON5': '0.250', 'weapon4': '0.342', 'ARMOR': '0.400', 'DAMAGECOUNT': '0.690', 'WEAPON3': '0.700', 'weapon2': '1.076', 'weapon3': '1.326', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:58,587][63734] DAMAGECOUNT value on done: 1490.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:58,870][63767] DAMAGECOUNT value on done: 1590.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:59,538][63735] DAMAGECOUNT value on done: 1327.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:59,539][63735] Sum rewards: -4.172, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.969', 'weapon5': '0.006', 'AMMO2': '0.008', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'AMMO4': '0.040', 'weapon7': '0.074', 'AMMO3': '0.075', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.140', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'weapon4': '0.252', 'DAMAGECOUNT': '0.489', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.254', 'weapon2': '1.302'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:59,740][63734] DAMAGECOUNT value on done: 1901.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:59,741][63734] Sum rewards: -2.379, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.360', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO2': '0.034', 'weapon5': '0.040', 'AMMO3': '0.075', 'HITCOUNT': '0.080', 'weapon7': '0.102', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO4': '0.169', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'weapon4': '0.234', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.441', 'WEAPON3': '0.450', 'ARMOR': '0.458', 'weapon3': '0.934', 'FRAGCOUNT': '1.000', 'weapon2': '1.542'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:59,866][63735] DAMAGECOUNT value on done: 1479.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:43:59,867][63735] Sum rewards: -5.456, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.446', 'AMMO2': '0.002', 'AMMO4': '0.011', 'ARMOR': '0.036', 'HITCOUNT': '0.090', 'AMMO3': '0.173', 'DAMAGECOUNT': '0.432', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.158', 'weapon3': '1.238'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:00,134][63734] DAMAGECOUNT value on done: 1977.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:00,135][63734] Sum rewards: -5.770, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.924', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.004', 'weapon5': '0.012', 'AMMO5': '0.013', 'AMMO4': '0.021', 'WEAPON1': '0.030', 'weapon7': '0.036', 'ARMOR': '0.040', 'WEAPON4': '0.100', 'HITCOUNT': '0.130', 'weapon4': '0.132', 'AMMO3': '0.140', 'WEAPON5': '0.150', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'DAMAGECOUNT': '0.630', 'WEAPON3': '0.700', 'weapon2': '1.006', 'weapon3': '1.160'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:00,265][63733] Updated weights for policy 1, policy_version 620 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:00,595][63767] DAMAGECOUNT value on done: 2289.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:00,596][63767] Sum rewards: -0.098, reward structure: {'DEATHCOUNT': '-5.250', 'AMMO5': '0.007', 'AMMO2': '0.018', 'weapon5': '0.036', 'ARMOR': '0.046', 'HEALTH': '0.060', 'weapon4': '0.064', 'AMMO3': '0.077', 'AMMO4': '0.090', 'HITCOUNT': '0.100', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.450', 'weapon2': '0.754', 'FRAGCOUNT': '1.000', 'weapon3': '1.664'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:00,855][63805] DAMAGECOUNT value on done: 1281.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:00,856][63805] Sum rewards: -6.044, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.040', 'AMMO5': '0.005', 'weapon5': '0.008', 'AMMO2': '0.011', 'WEAPON5': '0.050', 'AMMO4': '0.052', 'HITCOUNT': '0.100', 'AMMO3': '0.156', 'ARMOR': '0.416', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.012', 'weapon3': '1.586'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:00,941][63767] DAMAGECOUNT value on done: 1757.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:00,941][63767] Sum rewards: -5.369, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.808', 'AMMO2': '0.010', 'ARMOR': '0.044', 'AMMO4': '0.050', 'WEAPON4': '0.050', 'HITCOUNT': '0.050', 'weapon4': '0.106', 'DAMAGECOUNT': '0.150', 'AMMO3': '0.171', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.080', 'weapon3': '1.128'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:01,238][63805] DAMAGECOUNT value on done: 1634.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:01,238][63805] Sum rewards: -4.396, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.252', 'AMMO2': '0.002', 'AMMO5': '0.010', 'AMMO4': '0.011', 'ARMOR': '0.024', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.158', 'weapon4': '0.172', 'DAMAGECOUNT': '0.345', 'weapon2': '0.926', 'WEAPON3': '0.950', 'weapon3': '1.298', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:02,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11537.1, 300 sec: 11441.0). Total num frames: 4993024. Throughput: 0: 1622.2, 1: 1268.6. Samples: 1241415. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:02,460][109198] Avg episode reward: [(0, '-5.354'), (1, '-5.685')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:03,233][63769] DAMAGECOUNT value on done: 1461.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:03,234][63769] Sum rewards: -4.093, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.826', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'weapon5': '0.020', 'AMMO2': '0.027', 'HITCOUNT': '0.090', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.114', 'AMMO4': '0.136', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.234', 'weapon2': '1.332'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:03,618][63769] DAMAGECOUNT value on done: 1303.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:03,619][63769] Sum rewards: -9.288, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-3.000', 'HEALTH': '-0.830', 'AMMO5': '0.014', 'AMMO2': '0.018', 'weapon5': '0.020', 'ARMOR': '0.035', 'HITCOUNT': '0.040', 'weapon7': '0.066', 'AMMO3': '0.074', 'AMMO4': '0.091', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'DAMAGECOUNT': '0.135', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'weapon4': '0.300', 'WEAPON3': '0.450', 'weapon3': '0.880', 'weapon2': '1.518'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:03,733][63732] Updated weights for policy 0, policy_version 600 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:05,739][63770] DAMAGECOUNT value on done: 1558.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:05,740][63770] Sum rewards: -5.820, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.585', 'AMMO5': '0.005', 'AMMO2': '0.038', 'WEAPON5': '0.100', 'AMMO3': '0.103', 'HITCOUNT': '0.140', 'AMMO4': '0.191', 'weapon4': '0.304', 'WEAPON4': '0.400', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.600', 'weapon2': '0.974', 'FRAGCOUNT': '1.000', 'weapon3': '1.460'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:05,752][63771] DAMAGECOUNT value on done: 1225.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:05,752][63771] Sum rewards: -6.449, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.764', 'AMMO5': '0.005', 'AMMO2': '0.013', 'weapon5': '0.024', 'WEAPON4': '0.050', 'ARMOR': '0.057', 'AMMO4': '0.064', 'weapon4': '0.096', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.181', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.800', 'weapon3': '1.142', 'weapon2': '1.208', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:06,067][63770] DAMAGECOUNT value on done: 1456.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:06,068][63770] Sum rewards: -2.482, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.800', 'AMMO5': '0.010', 'weapon4': '0.016', 'WEAPON1': '0.020', 'AMMO2': '0.021', 'WEAPON4': '0.050', 'AMMO3': '0.056', 'weapon7': '0.088', 'HITCOUNT': '0.100', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO4': '0.106', 'weapon5': '0.178', 'WEAPON5': '0.300', 'WEAPON3': '0.300', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.705', 'weapon3': '0.912', 'weapon2': '1.406'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:06,143][63771] DAMAGECOUNT value on done: 1450.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:06,144][63771] Sum rewards: -2.672, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.852', 'AMMO5': '0.003', 'AMMO2': '0.012', 'weapon5': '0.018', 'WEAPON5': '0.050', 'AMMO4': '0.062', 'ARMOR': '0.077', 'AMMO3': '0.104', 'HITCOUNT': '0.130', 'weapon4': '0.130', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.600', 'weapon3': '0.830', 'weapon2': '1.434', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:06,630][63769] DAMAGECOUNT value on done: 1786.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:07,017][63769] DAMAGECOUNT value on done: 1175.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:07,377][63806] DAMAGECOUNT value on done: 1815.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:07,378][63806] Sum rewards: -6.917, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.152', 'AMMO5': '0.008', 'WEAPON1': '0.020', 'AMMO2': '0.033', 'weapon5': '0.066', 'AMMO3': '0.078', 'HITCOUNT': '0.100', 'AMMO4': '0.165', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.231', 'WEAPON4': '0.400', 'WEAPON3': '0.400', 'weapon4': '0.644', 'weapon3': '0.788', 'ARMOR': '0.892', 'FRAGCOUNT': '1.000', 'weapon2': '1.210'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:07,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11537.1, 300 sec: 11454.9). Total num frames: 5050368. Throughput: 0: 1624.7, 1: 1268.6. Samples: 1258823. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:07,460][109198] Avg episode reward: [(0, '-5.285'), (1, '-5.593')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:07,466][63454] Saving new best policy, reward=-5.285!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:07,738][63806] DAMAGECOUNT value on done: 2029.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:07,782][63806] DAMAGECOUNT value on done: 1285.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:07,783][63806] Sum rewards: -4.671, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.156', 'AMMO5': '0.010', 'AMMO2': '0.020', 'weapon5': '0.044', 'weapon7': '0.058', 'AMMO4': '0.099', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'HITCOUNT': '0.120', 'AMMO3': '0.140', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.254', 'weapon3': '1.640'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:08,111][63806] DAMAGECOUNT value on done: 1998.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:08,112][63806] Sum rewards: -1.085, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.250', 'weapon5': '0.002', 'AMMO5': '0.010', 'AMMO2': '0.013', 'weapon7': '0.016', 'AMMO4': '0.065', 'weapon4': '0.072', 'WEAPON4': '0.100', 'AMMO3': '0.132', 'WEAPON5': '0.150', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.280', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.020', 'weapon3': '1.060', 'weapon2': '1.394', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:08,354][63733] Updated weights for policy 1, policy_version 630 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:08,519][63771] DAMAGECOUNT value on done: 1530.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:08,520][63771] Sum rewards: -9.316, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.072', 'FRAGCOUNT': '-1.500', 'ARMOR': '0.012', 'AMMO2': '0.024', 'AMMO5': '0.024', 'weapon5': '0.060', 'weapon7': '0.086', 'HITCOUNT': '0.090', 'AMMO4': '0.119', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.132', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.345', 'WEAPON4': '0.350', 'WEAPON5': '0.400', 'weapon4': '0.402', 'WEAPON3': '0.650', 'weapon3': '0.822', 'weapon2': '1.550'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:08,874][63771] DAMAGECOUNT value on done: 2252.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:08,874][63771] Sum rewards: -3.615, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.350', 'AMMO5': '0.005', 'weapon5': '0.010', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'weapon4': '0.052', 'AMMO4': '0.090', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.124', 'HITCOUNT': '0.160', 'DAMAGECOUNT': '0.558', 'WEAPON3': '0.650', 'weapon2': '0.982', 'FRAGCOUNT': '1.000', 'weapon3': '1.330'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:10,232][63732] Updated weights for policy 0, policy_version 610 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:12,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11537.1, 300 sec: 11454.9). Total num frames: 5107712. Throughput: 0: 1614.5, 1: 1264.2. Samples: 1275521. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:12,460][109198] Avg episode reward: [(0, '-5.296'), (1, '-5.569')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:14,103][63735] DAMAGECOUNT value on done: 2182.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:14,103][63735] Sum rewards: -12.481, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-3.855', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'AMMO5': '0.003', 'ARMOR': '0.048', 'WEAPON5': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.204', 'DAMAGECOUNT': '0.270', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.200', 'weapon3': '1.330', 'weapon2': '1.470'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:14,455][63735] DAMAGECOUNT value on done: 2155.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:16,564][63733] Updated weights for policy 1, policy_version 640 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:16,651][63732] Updated weights for policy 0, policy_version 620 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:16,859][63770] DAMAGECOUNT value on done: 1255.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:16,860][63770] Sum rewards: -7.566, reward structure: {'DEATHCOUNT': '-10.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.353', 'AMMO5': '0.005', 'weapon5': '0.008', 'AMMO2': '0.031', 'AMMO3': '0.071', 'HITCOUNT': '0.080', 'WEAPON5': '0.100', 'AMMO4': '0.153', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.225', 'weapon4': '0.242', 'WEAPON3': '0.450', 'ARMOR': '0.532', 'weapon3': '1.036', 'weapon2': '1.654'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:17,198][63770] DAMAGECOUNT value on done: 2061.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:17,198][63770] Sum rewards: -7.431, reward structure: {'DEATHCOUNT': '-15.000', 'HEALTH': '-1.288', 'WEAPON1': '0.010', 'weapon5': '0.024', 'AMMO5': '0.025', 'AMMO2': '0.028', 'weapon4': '0.082', 'AMMO4': '0.140', 'AMMO3': '0.200', 'HITCOUNT': '0.230', 'WEAPON5': '0.250', 'WEAPON4': '0.250', 'WEAPON3': '0.950', 'DAMAGECOUNT': '0.969', 'weapon2': '1.182', 'weapon3': '1.516', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:17,458][109198] Fps is (10 sec: 11878.5, 60 sec: 11537.1, 300 sec: 11454.9). Total num frames: 5169152. Throughput: 0: 1615.1, 1: 1264.6. Samples: 1284220. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:17,460][109198] Avg episode reward: [(0, '-5.348'), (1, '-5.627')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:20,192][63805] DAMAGECOUNT value on done: 1489.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:20,569][63805] DAMAGECOUNT value on done: 2233.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:20,570][63805] Sum rewards: -4.580, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.447', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.023', 'AMMO2': '0.027', 'weapon5': '0.034', 'HITCOUNT': '0.080', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.118', 'AMMO4': '0.137', 'DAMAGECOUNT': '0.240', 'WEAPON4': '0.300', 'WEAPON5': '0.350', 'WEAPON3': '0.700', 'weapon4': '0.710', 'weapon3': '0.872', 'ARMOR': '1.034', 'weapon2': '1.442'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:21,661][63767] DAMAGECOUNT value on done: 1760.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:21,661][63767] Sum rewards: -4.441, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.158', 'AMMO5': '0.014', 'ARMOR': '0.016', 'AMMO2': '0.028', 'weapon5': '0.056', 'weapon7': '0.074', 'AMMO3': '0.091', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO4': '0.140', 'HITCOUNT': '0.160', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.585', 'WEAPON3': '0.600', 'weapon2': '1.296', 'weapon3': '1.306'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:21,903][63734] DAMAGECOUNT value on done: 1600.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:21,904][63734] Sum rewards: -0.873, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.550', 'AMMO5': '0.018', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'weapon5': '0.050', 'AMMO4': '0.088', 'AMMO3': '0.092', 'HITCOUNT': '0.140', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.380', 'ARMOR': '0.432', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.693', 'FRAGCOUNT': '1.000', 'weapon2': '1.210', 'weapon3': '1.236'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:22,040][63767] DAMAGECOUNT value on done: 1759.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:22,041][63767] Sum rewards: 0.308, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.910', 'AMMO5': '0.012', 'AMMO2': '0.022', 'WEAPON1': '0.040', 'weapon5': '0.080', 'WEAPON4': '0.100', 'AMMO4': '0.110', 'AMMO3': '0.120', 'HITCOUNT': '0.210', 'weapon4': '0.214', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.507', 'WEAPON3': '0.550', 'weapon3': '1.148', 'weapon2': '1.354', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:22,300][63734] DAMAGECOUNT value on done: 1734.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:22,458][109198] Fps is (10 sec: 11878.4, 60 sec: 11537.1, 300 sec: 11454.9). Total num frames: 5226496. Throughput: 0: 1616.1, 1: 1264.9. Samples: 1301668. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:22,460][109198] Avg episode reward: [(0, '-5.248'), (1, '-5.627')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:22,461][63454] Saving new best policy, reward=-5.248!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:22,966][63732] Updated weights for policy 0, policy_version 630 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:23,233][63767] DAMAGECOUNT value on done: 2454.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:23,234][63767] Sum rewards: -2.624, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.430', 'WEAPON1': '0.020', 'AMMO2': '0.022', 'weapon7': '0.058', 'AMMO4': '0.110', 'ARMOR': '0.112', 'AMMO3': '0.149', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'AMMO6': '0.160', 'AMMO7': '0.160', 'weapon4': '0.166', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.750', 'weapon2': '0.888', 'FRAGCOUNT': '1.000', 'weapon3': '1.466'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:23,605][63805] DAMAGECOUNT value on done: 1330.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:23,606][63805] Sum rewards: -7.431, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.406', 'AMMO2': '0.005', 'AMMO4': '0.023', 'HITCOUNT': '0.060', 'AMMO3': '0.130', 'DAMAGECOUNT': '0.147', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.184', 'weapon3': '1.676'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:23,622][63767] DAMAGECOUNT value on done: 1882.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:23,622][63767] Sum rewards: -6.125, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.712', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.007', 'AMMO5': '0.007', 'AMMO4': '0.034', 'WEAPON4': '0.050', 'weapon5': '0.072', 'HITCOUNT': '0.110', 'weapon4': '0.130', 'AMMO3': '0.144', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.900', 'weapon2': '0.976', 'weapon3': '1.332'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:23,975][63805] DAMAGECOUNT value on done: 1674.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:24,093][63735] DAMAGECOUNT value on done: 1456.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:24,094][63735] Sum rewards: -5.382, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.460', 'AMMO5': '0.005', 'AMMO2': '0.008', 'WEAPON1': '0.030', 'AMMO4': '0.041', 'weapon5': '0.046', 'WEAPON4': '0.050', 'AMMO3': '0.078', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'weapon4': '0.128', 'DAMAGECOUNT': '0.387', 'ARMOR': '0.456', 'WEAPON3': '0.500', 'weapon2': '1.382', 'weapon3': '1.506'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:24,445][63735] DAMAGECOUNT value on done: 1704.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:24,446][63735] Sum rewards: -3.898, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.190', 'AMMO4': '-0.023', 'AMMO2': '-0.005', 'AMMO5': '0.005', 'WEAPON5': '0.050', 'HITCOUNT': '0.120', 'AMMO3': '0.157', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.850', 'weapon2': '1.204', 'weapon3': '1.258', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:24,957][63733] Updated weights for policy 1, policy_version 650 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:25,025][63734] DAMAGECOUNT value on done: 2216.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:25,025][63734] Sum rewards: -4.018, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.132', 'AMMO5': '0.020', 'AMMO2': '0.021', 'ARMOR': '0.044', 'weapon5': '0.050', 'AMMO4': '0.105', 'AMMO3': '0.125', 'weapon4': '0.174', 'WEAPON5': '0.200', 'HITCOUNT': '0.290', 'WEAPON4': '0.300', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.945', 'weapon2': '1.048', 'weapon3': '1.492', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:25,404][63734] DAMAGECOUNT value on done: 1986.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:27,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11537.0, 300 sec: 11468.8). Total num frames: 5283840. Throughput: 0: 1643.9, 1: 1233.2. Samples: 1318749. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:27,460][109198] Avg episode reward: [(0, '-5.177'), (1, '-5.583')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:27,467][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000652_2670592.pth...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:27,468][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000638_2613248.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:27,528][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000347_1421312.pth\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:27,531][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000269_1101824.pth\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:27,538][63454] Saving new best policy, reward=-5.177!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:28,320][63732] Updated weights for policy 0, policy_version 640 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:28,473][63769] DAMAGECOUNT value on done: 1481.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:28,474][63769] Sum rewards: -3.169, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.215', 'AMMO2': '0.007', 'HITCOUNT': '0.030', 'AMMO4': '0.033', 'WEAPON4': '0.050', 'ARMOR': '0.052', 'DAMAGECOUNT': '0.060', 'weapon4': '0.082', 'AMMO3': '0.132', 'WEAPON3': '0.600', 'weapon3': '0.994', 'FRAGCOUNT': '1.000', 'weapon2': '1.506'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:28,644][63771] DAMAGECOUNT value on done: 1359.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:28,644][63771] Sum rewards: -3.944, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.856', 'AMMO2': '0.011', 'WEAPON1': '0.020', 'ARMOR': '0.020', 'AMMO4': '0.056', 'HITCOUNT': '0.080', 'AMMO3': '0.097', 'DAMAGECOUNT': '0.402', 'WEAPON3': '0.450', 'weapon3': '0.930', 'FRAGCOUNT': '1.000', 'weapon2': '1.596'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:28,883][63769] DAMAGECOUNT value on done: 1433.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:28,884][63769] Sum rewards: -9.363, reward structure: {'DEATHCOUNT': '-12.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.456', 'AMMO5': '0.012', 'weapon7': '0.016', 'AMMO2': '0.017', 'weapon5': '0.028', 'ARMOR': '0.036', 'AMMO4': '0.083', 'AMMO3': '0.119', 'weapon4': '0.120', 'HITCOUNT': '0.130', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.750', 'weapon3': '1.280', 'weapon2': '1.662'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:28,944][63770] DAMAGECOUNT value on done: 1665.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:28,945][63770] Sum rewards: -6.784, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.981', 'weapon4': '0.004', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'ARMOR': '0.036', 'weapon5': '0.036', 'AMMO4': '0.084', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.156', 'DAMAGECOUNT': '0.321', 'WEAPON3': '0.900', 'weapon2': '1.024', 'weapon3': '1.794'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:29,066][63771] DAMAGECOUNT value on done: 1642.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:29,066][63771] Sum rewards: -3.425, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.048', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.018', 'AMMO4': '0.087', 'AMMO3': '0.097', 'WEAPON5': '0.100', 'weapon4': '0.128', 'WEAPON4': '0.150', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.576', 'WEAPON3': '0.600', 'weapon2': '0.914', 'FRAGCOUNT': '1.000', 'weapon3': '1.768'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:29,272][63770] DAMAGECOUNT value on done: 1651.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:29,273][63770] Sum rewards: -1.758, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.566', 'AMMO5': '0.005', 'AMMO2': '0.016', 'WEAPON5': '0.050', 'AMMO4': '0.078', 'AMMO3': '0.114', 'HITCOUNT': '0.160', 'WEAPON4': '0.200', 'weapon4': '0.262', 'ARMOR': '0.464', 'DAMAGECOUNT': '0.585', 'WEAPON3': '0.700', 'weapon3': '1.542', 'weapon2': '1.632', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:29,539][63769] DAMAGECOUNT value on done: 2065.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:29,540][63769] Sum rewards: -4.389, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.671', 'AMMO5': '0.012', 'weapon5': '0.014', 'AMMO2': '0.017', 'ARMOR': '0.063', 'AMMO4': '0.084', 'AMMO3': '0.087', 'weapon4': '0.174', 'WEAPON4': '0.200', 'HITCOUNT': '0.250', 'WEAPON5': '0.250', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.600', 'weapon2': '0.768', 'DAMAGECOUNT': '0.837', 'weapon3': '1.676'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:29,953][63769] DAMAGECOUNT value on done: 1275.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:29,953][63769] Sum rewards: 0.093, reward structure: {'DEATHCOUNT': '-3.750', 'HEALTH': '-1.060', 'AMMO4': '-0.021', 'AMMO2': '-0.004', 'AMMO5': '0.005', 'HITCOUNT': '0.050', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.106', 'DAMAGECOUNT': '0.300', 'weapon4': '0.346', 'WEAPON3': '0.450', 'ARMOR': '0.481', 'weapon2': '0.852', 'FRAGCOUNT': '1.000', 'weapon3': '1.138'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:30,380][63806] DAMAGECOUNT value on done: 1955.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:30,381][63806] Sum rewards: -6.479, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.148', 'AMMO5': '0.007', 'AMMO2': '0.018', 'weapon5': '0.022', 'WEAPON1': '0.040', 'ARMOR': '0.064', 'HITCOUNT': '0.080', 'AMMO4': '0.091', 'WEAPON5': '0.150', 'AMMO3': '0.156', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.420', 'weapon4': '0.438', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon3': '1.172', 'weapon2': '1.360'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:30,841][63806] DAMAGECOUNT value on done: 2153.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:30,842][63806] Sum rewards: -6.552, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.684', 'AMMO5': '0.009', 'AMMO2': '0.020', 'weapon5': '0.036', 'HITCOUNT': '0.080', 'AMMO4': '0.099', 'WEAPON5': '0.100', 'AMMO3': '0.101', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.372', 'weapon4': '0.376', 'ARMOR': '0.400', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.244', 'weapon2': '1.694'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:30,930][63806] DAMAGECOUNT value on done: 1300.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:31,371][63806] DAMAGECOUNT value on done: 2073.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:31,371][63806] Sum rewards: -3.228, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-0.500', 'HEALTH': '-0.110', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'AMMO2': '0.019', 'ARMOR': '0.020', 'WEAPON4': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.092', 'AMMO4': '0.096', 'weapon4': '0.100', 'weapon5': '0.136', 'DAMAGECOUNT': '0.225', 'WEAPON5': '0.300', 'WEAPON3': '0.450', 'weapon2': '0.968', 'weapon3': '1.590'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:32,458][109198] Fps is (10 sec: 10649.6, 60 sec: 11400.5, 300 sec: 11441.0). Total num frames: 5332992. Throughput: 0: 1661.7, 1: 1204.0. Samples: 1326960. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:32,459][109198] Avg episode reward: [(0, '-5.238'), (1, '-5.359')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:34,616][63771] DAMAGECOUNT value on done: 1650.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:34,974][63732] Updated weights for policy 0, policy_version 650 (0.0015)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:35,113][63771] DAMAGECOUNT value on done: 2567.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:35,114][63771] Sum rewards: -4.448, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.785', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'AMMO5': '0.005', 'weapon5': '0.006', 'ARMOR': '0.044', 'WEAPON5': '0.050', 'AMMO3': '0.134', 'HITCOUNT': '0.250', 'FRAGCOUNT': '0.500', 'weapon2': '0.646', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.945', 'weapon3': '2.120'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:36,631][63733] Updated weights for policy 1, policy_version 660 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:36,968][63735] DAMAGECOUNT value on done: 2307.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:36,969][63735] Sum rewards: -3.668, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.650', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.003', 'WEAPON1': '0.020', 'weapon4': '0.038', 'WEAPON4': '0.050', 'ARMOR': '0.068', 'HITCOUNT': '0.070', 'AMMO3': '0.088', 'WEAPON5': '0.100', 'weapon5': '0.104', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.450', 'FRAGCOUNT': '0.500', 'weapon3': '1.014', 'weapon2': '1.108'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:37,400][63735] DAMAGECOUNT value on done: 2315.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:37,401][63735] Sum rewards: -4.021, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.560', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.017', 'AMMO2': '-0.003', 'weapon5': '0.006', 'AMMO5': '0.009', 'ARMOR': '0.040', 'AMMO3': '0.093', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.116', 'HITCOUNT': '0.120', 'DAMAGECOUNT': '0.480', 'WEAPON3': '0.600', 'weapon3': '1.024', 'weapon2': '1.370'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:37,458][109198] Fps is (10 sec: 9420.9, 60 sec: 11195.7, 300 sec: 11413.3). Total num frames: 5378048. Throughput: 0: 1631.3, 1: 1153.5. Samples: 1340664. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:37,460][109198] Avg episode reward: [(0, '-5.174'), (1, '-5.309')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:37,466][63454] Saving new best policy, reward=-5.174!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:37,466][63576] Saving new best policy, reward=-5.309!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:41,368][63732] Updated weights for policy 0, policy_version 660 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:41,993][63770] DAMAGECOUNT value on done: 1280.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:42,325][63770] DAMAGECOUNT value on done: 2111.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:42,458][109198] Fps is (10 sec: 9830.4, 60 sec: 11127.5, 300 sec: 11399.4). Total num frames: 5431296. Throughput: 0: 1632.0, 1: 1117.3. Samples: 1356547. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:42,460][109198] Avg episode reward: [(0, '-5.218'), (1, '-5.309')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:45,292][63805] DAMAGECOUNT value on done: 1580.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:45,292][63805] Sum rewards: -2.870, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.882', 'weapon5': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.017', 'WEAPON1': '0.020', 'AMMO4': '0.083', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.141', 'WEAPON5': '0.150', 'weapon7': '0.154', 'AMMO6': '0.220', 'AMMO7': '0.220', 'DAMAGECOUNT': '0.273', 'WEAPON7': '0.300', 'ARMOR': '0.460', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.338', 'weapon2': '1.658'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:45,688][63805] DAMAGECOUNT value on done: 2362.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:45,689][63805] Sum rewards: -3.926, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.342', 'AMMO2': '0.000', 'AMMO4': '0.002', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'weapon5': '0.034', 'WEAPON5': '0.100', 'HITCOUNT': '0.130', 'AMMO3': '0.170', 'WEAPON4': '0.200', 'weapon4': '0.262', 'DAMAGECOUNT': '0.387', 'ARMOR': '0.518', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.254', 'weapon3': '1.684'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:46,142][63733] Updated weights for policy 1, policy_version 670 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:46,605][63767] DAMAGECOUNT value on done: 2029.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:46,605][63767] Sum rewards: -0.014, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.596', 'AMMO2': '0.007', 'AMMO5': '0.013', 'weapon5': '0.016', 'AMMO4': '0.032', 'WEAPON4': '0.050', 'weapon4': '0.066', 'AMMO3': '0.115', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon7': '0.128', 'WEAPON5': '0.150', 'WEAPON7': '0.200', 'HITCOUNT': '0.220', 'ARMOR': '0.428', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.807', 'weapon2': '1.396', 'weapon3': '1.514', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:46,999][63767] DAMAGECOUNT value on done: 1823.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:47,309][63734] DAMAGECOUNT value on done: 1751.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:47,310][63734] Sum rewards: 0.103, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.385', 'weapon4': '0.004', 'AMMO5': '0.010', 'AMMO2': '0.016', 'weapon5': '0.016', 'WEAPON1': '0.030', 'weapon7': '0.034', 'WEAPON4': '0.050', 'AMMO4': '0.077', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.116', 'HITCOUNT': '0.150', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.453', 'WEAPON3': '0.500', 'ARMOR': '0.536', 'weapon2': '1.048', 'weapon3': '1.698', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:47,439][63732] Updated weights for policy 0, policy_version 670 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:47,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11127.5, 300 sec: 11413.3). Total num frames: 5492736. Throughput: 0: 1637.7, 1: 1108.6. Samples: 1365001. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:47,460][109198] Avg episode reward: [(0, '-5.059'), (1, '-5.309')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:47,468][63454] Saving new best policy, reward=-5.059!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:47,718][63734] DAMAGECOUNT value on done: 2036.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:47,719][63734] Sum rewards: 0.831, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.182', 'AMMO5': '0.012', 'AMMO2': '0.013', 'WEAPON1': '0.020', 'weapon5': '0.020', 'ARMOR': '0.052', 'AMMO4': '0.064', 'AMMO3': '0.148', 'WEAPON5': '0.150', 'HITCOUNT': '0.190', 'WEAPON4': '0.200', 'weapon4': '0.218', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.906', 'weapon2': '1.550', 'weapon3': '1.620', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:48,278][63767] DAMAGECOUNT value on done: 2559.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:48,279][63767] Sum rewards: -2.179, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.202', 'ARMOR': '0.004', 'AMMO2': '0.005', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO4': '0.023', 'weapon7': '0.046', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.146', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'weapon4': '0.280', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.750', 'weapon2': '0.906', 'weapon3': '1.428', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:48,595][63767] DAMAGECOUNT value on done: 2074.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:48,595][63767] Sum rewards: -5.780, reward structure: {'DEATHCOUNT': '-10.500', 'FRAGCOUNT': '-0.500', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO2': '0.029', 'AMMO3': '0.079', 'weapon5': '0.084', 'HEALTH': '0.096', 'weapon4': '0.112', 'HITCOUNT': '0.120', 'AMMO4': '0.142', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.576', 'weapon3': '1.112', 'weapon2': '2.048'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:48,776][63805] DAMAGECOUNT value on done: 1460.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:48,776][63805] Sum rewards: -3.547, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.714', 'AMMO2': '0.013', 'AMMO5': '0.023', 'weapon5': '0.034', 'AMMO4': '0.063', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.150', 'WEAPON5': '0.250', 'weapon4': '0.256', 'DAMAGECOUNT': '0.390', 'ARMOR': '0.420', 'WEAPON3': '0.950', 'weapon2': '1.006', 'weapon3': '1.912', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:49,180][63805] DAMAGECOUNT value on done: 1843.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:49,181][63805] Sum rewards: -5.136, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.290', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.012', 'WEAPON4': '0.050', 'HITCOUNT': '0.050', 'weapon4': '0.054', 'weapon5': '0.074', 'AMMO3': '0.158', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.507', 'WEAPON3': '0.850', 'weapon3': '1.384', 'weapon2': '1.470'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:50,636][63735] DAMAGECOUNT value on done: 1506.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:50,637][63735] Sum rewards: -3.105, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.718', 'AMMO2': '0.012', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'weapon5': '0.028', 'ARMOR': '0.032', 'HITCOUNT': '0.050', 'weapon4': '0.052', 'AMMO4': '0.062', 'AMMO3': '0.129', 'DAMAGECOUNT': '0.150', 'WEAPON4': '0.150', 'WEAPON5': '0.250', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.542', 'weapon3': '1.668'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:51,016][63735] DAMAGECOUNT value on done: 1714.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:51,661][63734] DAMAGECOUNT value on done: 2357.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:52,063][63734] DAMAGECOUNT value on done: 2081.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:52,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11127.5, 300 sec: 11413.3). Total num frames: 5545984. Throughput: 0: 1618.5, 1: 1116.2. Samples: 1381882. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:52,460][109198] Avg episode reward: [(0, '-4.940'), (1, '-5.318')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:52,461][63454] Saving new best policy, reward=-4.940!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:53,151][63806] DAMAGECOUNT value on done: 2000.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:53,480][63806] DAMAGECOUNT value on done: 1432.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:53,744][63733] Updated weights for policy 1, policy_version 680 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:54,784][63732] Updated weights for policy 0, policy_version 680 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:55,089][63769] DAMAGECOUNT value on done: 1676.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:55,090][63769] Sum rewards: -4.103, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.127', 'AMMO4': '-0.000', 'AMMO2': '0.000', 'AMMO5': '0.009', 'weapon4': '0.012', 'WEAPON1': '0.020', 'weapon5': '0.024', 'ARMOR': '0.032', 'WEAPON4': '0.100', 'AMMO3': '0.116', 'HITCOUNT': '0.180', 'WEAPON5': '0.200', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.585', 'weapon2': '1.476', 'weapon3': '1.520'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:55,315][63771] DAMAGECOUNT value on done: 1534.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:55,316][63771] Sum rewards: 0.267, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.850', 'AMMO5': '0.003', 'weapon5': '0.010', 'AMMO2': '0.012', 'WEAPON1': '0.030', 'WEAPON5': '0.050', 'AMMO4': '0.059', 'weapon4': '0.090', 'WEAPON4': '0.100', 'weapon7': '0.110', 'HITCOUNT': '0.120', 'AMMO3': '0.148', 'AMMO6': '0.320', 'AMMO7': '0.320', 'WEAPON7': '0.400', 'DAMAGECOUNT': '0.525', 'WEAPON3': '0.700', 'weapon3': '1.236', 'weapon2': '1.634', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:55,526][63769] DAMAGECOUNT value on done: 1843.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:55,526][63769] Sum rewards: -2.946, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.726', 'AMMO5': '0.010', 'AMMO2': '0.015', 'weapon5': '0.030', 'AMMO4': '0.076', 'weapon7': '0.084', 'WEAPON5': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.126', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'weapon4': '0.204', 'HITCOUNT': '0.260', 'ARMOR': '0.424', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.230', 'weapon2': '1.430', 'FRAGCOUNT': '1.500', 'weapon3': '1.600'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:55,596][63770] DAMAGECOUNT value on done: 2163.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:55,597][63770] Sum rewards: -4.137, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.980', 'AMMO2': '0.003', 'AMMO4': '0.015', 'AMMO5': '0.017', 'ARMOR': '0.028', 'AMMO3': '0.103', 'HITCOUNT': '0.180', 'weapon5': '0.196', 'WEAPON5': '0.450', 'WEAPON3': '0.550', 'weapon2': '1.482', 'DAMAGECOUNT': '1.494', 'weapon3': '1.574', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:55,714][63771] DAMAGECOUNT value on done: 1838.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:55,715][63771] Sum rewards: -1.272, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.740', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.005', 'weapon5': '0.008', 'WEAPON5': '0.050', 'AMMO3': '0.091', 'HITCOUNT': '0.140', 'WEAPON3': '0.300', 'ARMOR': '0.454', 'DAMAGECOUNT': '0.588', 'weapon2': '1.288', 'weapon3': '1.290', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:56,005][63770] DAMAGECOUNT value on done: 1801.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:56,006][63770] Sum rewards: -4.617, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.640', 'AMMO2': '0.020', 'weapon4': '0.030', 'ARMOR': '0.032', 'AMMO4': '0.097', 'WEAPON4': '0.100', 'HITCOUNT': '0.120', 'AMMO3': '0.150', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.900', 'weapon2': '1.134', 'weapon3': '1.740', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:56,172][63769] DAMAGECOUNT value on done: 2228.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:56,173][63769] Sum rewards: -4.578, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.350', 'AMMO2': '0.006', 'AMMO5': '0.014', 'AMMO4': '0.032', 'WEAPON4': '0.050', 'weapon4': '0.056', 'weapon5': '0.072', 'AMMO3': '0.117', 'HITCOUNT': '0.190', 'WEAPON5': '0.300', 'ARMOR': '0.484', 'DAMAGECOUNT': '0.489', 'WEAPON3': '0.650', 'weapon2': '1.620', 'weapon3': '1.692'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:56,558][63769] DAMAGECOUNT value on done: 1325.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:57,087][63806] DAMAGECOUNT value on done: 2298.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:57,087][63806] Sum rewards: -4.104, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.111', 'AMMO5': '0.003', 'AMMO2': '0.004', 'AMMO4': '0.018', 'HITCOUNT': '0.080', 'AMMO3': '0.140', 'WEAPON4': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon4': '0.376', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.850', 'weapon2': '0.932', 'FRAGCOUNT': '1.000', 'weapon3': '1.620'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:57,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11127.5, 300 sec: 11413.3). Total num frames: 5603328. Throughput: 0: 1595.5, 1: 1136.9. Samples: 1398478. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:44:57,460][109198] Avg episode reward: [(0, '-4.708'), (1, '-5.344')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:57,466][63454] Saving new best policy, reward=-4.708!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:57,485][63806] DAMAGECOUNT value on done: 2479.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:57,486][63806] Sum rewards: -4.801, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.169', 'AMMO2': '0.011', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.054', 'AMMO3': '0.113', 'weapon5': '0.124', 'weapon4': '0.188', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'HITCOUNT': '0.250', 'WEAPON3': '0.700', 'ARMOR': '0.937', 'DAMAGECOUNT': '1.218', 'weapon3': '1.484', 'weapon2': '1.556', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:59,272][63735] DAMAGECOUNT value on done: 2452.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:59,631][63735] DAMAGECOUNT value on done: 2415.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:44:59,631][63735] Sum rewards: -5.277, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.086', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'AMMO2': '0.016', 'weapon5': '0.018', 'WEAPON5': '0.050', 'HITCOUNT': '0.080', 'AMMO4': '0.081', 'AMMO3': '0.129', 'WEAPON4': '0.200', 'weapon4': '0.236', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.750', 'weapon2': '1.158', 'weapon3': '1.536'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:00,280][63771] DAMAGECOUNT value on done: 1815.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:00,281][63771] Sum rewards: 0.728, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.776', 'AMMO2': '0.008', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'ARMOR': '0.020', 'AMMO4': '0.041', 'WEAPON4': '0.050', 'weapon5': '0.066', 'AMMO3': '0.140', 'HITCOUNT': '0.170', 'weapon4': '0.180', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.700', 'weapon2': '1.134', 'weapon3': '1.964', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:00,624][63771] DAMAGECOUNT value on done: 2963.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:00,624][63771] Sum rewards: -4.282, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-1.030', 'AMMO5': '0.010', 'weapon5': '0.010', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'AMMO2': '0.034', 'AMMO3': '0.144', 'AMMO4': '0.172', 'WEAPON5': '0.200', 'weapon4': '0.200', 'HITCOUNT': '0.320', 'WEAPON4': '0.400', 'WEAPON3': '0.800', 'weapon2': '1.168', 'DAMAGECOUNT': '1.188', 'weapon3': '1.550', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:01,021][63733] Updated weights for policy 1, policy_version 690 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:02,147][63732] Updated weights for policy 0, policy_version 690 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:02,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11127.4, 300 sec: 11399.4). Total num frames: 5660672. Throughput: 0: 1580.4, 1: 1147.2. Samples: 1406960. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:02,460][109198] Avg episode reward: [(0, '-4.648'), (1, '-5.312')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:02,462][63454] Saving new best policy, reward=-4.648!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:07,263][63770] DAMAGECOUNT value on done: 1435.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:07,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11059.2, 300 sec: 11399.4). Total num frames: 5713920. Throughput: 0: 1540.8, 1: 1179.3. Samples: 1424072. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:07,460][109198] Avg episode reward: [(0, '-4.682'), (1, '-5.312')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:07,663][63770] DAMAGECOUNT value on done: 2126.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:07,737][63733] Updated weights for policy 1, policy_version 700 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:09,175][63767] DAMAGECOUNT value on done: 2409.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:09,175][63767] Sum rewards: -5.735, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-1.344', 'weapon5': '0.014', 'AMMO5': '0.015', 'AMMO2': '0.015', 'AMMO4': '0.075', 'AMMO3': '0.202', 'WEAPON4': '0.250', 'weapon4': '0.282', 'HITCOUNT': '0.290', 'WEAPON5': '0.300', 'ARMOR': '0.451', 'weapon2': '0.952', 'WEAPON3': '1.050', 'DAMAGECOUNT': '1.140', 'FRAGCOUNT': '2.000', 'weapon3': '2.072'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:09,494][63767] DAMAGECOUNT value on done: 2171.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:09,495][63767] Sum rewards: -3.132, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.024', 'AMMO4': '-0.013', 'AMMO2': '-0.003', 'WEAPON1': '0.020', 'weapon4': '0.020', 'AMMO5': '0.022', 'ARMOR': '0.024', 'WEAPON4': '0.050', 'weapon5': '0.078', 'AMMO3': '0.166', 'HITCOUNT': '0.290', 'WEAPON5': '0.350', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.044', 'weapon3': '1.386', 'weapon2': '1.808', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:09,883][63732] Updated weights for policy 0, policy_version 700 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:09,975][63805] DAMAGECOUNT value on done: 1665.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:09,976][63805] Sum rewards: -0.994, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.370', 'AMMO2': '0.006', 'AMMO5': '0.015', 'AMMO4': '0.027', 'WEAPON4': '0.050', 'weapon5': '0.050', 'HITCOUNT': '0.080', 'weapon4': '0.152', 'AMMO3': '0.165', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.255', 'ARMOR': '0.464', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.700', 'weapon2': '1.468', 'weapon3': '1.944'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:10,296][63734] DAMAGECOUNT value on done: 1776.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:10,309][63805] DAMAGECOUNT value on done: 2527.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:10,309][63805] Sum rewards: -6.925, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.130', 'AMMO4': '-0.031', 'AMMO2': '-0.006', 'weapon7': '0.072', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.120', 'AMMO3': '0.155', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.048', 'weapon3': '1.562'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:10,682][63734] DAMAGECOUNT value on done: 2091.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:10,683][63734] Sum rewards: -9.103, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.888', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'weapon5': '0.012', 'AMMO2': '0.018', 'weapon7': '0.054', 'HITCOUNT': '0.060', 'weapon4': '0.062', 'AMMO4': '0.090', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON5': '0.100', 'ARMOR': '0.111', 'DAMAGECOUNT': '0.165', 'WEAPON4': '0.200', 'AMMO3': '0.228', 'weapon2': '1.178', 'WEAPON3': '1.200', 'weapon3': '1.502'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:10,719][63767] DAMAGECOUNT value on done: 2750.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:10,719][63767] Sum rewards: -1.961, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.780', 'AMMO2': '0.010', 'AMMO5': '0.032', 'AMMO4': '0.051', 'weapon4': '0.078', 'AMMO3': '0.083', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON4': '0.100', 'weapon5': '0.132', 'HITCOUNT': '0.150', 'weapon7': '0.154', 'WEAPON5': '0.550', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.573', 'FRAGCOUNT': '1.000', 'weapon2': '1.084', 'weapon3': '1.472'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:11,046][63767] DAMAGECOUNT value on done: 2349.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:11,047][63767] Sum rewards: -1.439, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.478', 'AMMO4': '-0.018', 'AMMO2': '-0.004', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'weapon4': '0.024', 'weapon5': '0.032', 'WEAPON4': '0.050', 'AMMO3': '0.130', 'weapon7': '0.176', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.230', 'WEAPON5': '0.250', 'ARMOR': '0.525', 'DAMAGECOUNT': '0.825', 'WEAPON3': '0.850', 'weapon3': '1.518', 'weapon2': '1.566', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:11,562][63805] DAMAGECOUNT value on done: 1686.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:11,562][63805] Sum rewards: -0.990, reward structure: {'DEATHCOUNT': '-10.500', 'AMMO5': '0.015', 'weapon5': '0.024', 'AMMO2': '0.030', 'weapon7': '0.074', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'HEALTH': '0.122', 'weapon4': '0.124', 'AMMO3': '0.136', 'WEAPON4': '0.150', 'AMMO4': '0.150', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'ARMOR': '0.416', 'DAMAGECOUNT': '0.678', 'WEAPON3': '0.750', 'weapon2': '1.190', 'weapon3': '1.880', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:11,897][63805] DAMAGECOUNT value on done: 2286.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:11,897][63805] Sum rewards: 3.566, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.773', 'AMMO4': '-0.003', 'AMMO2': '-0.000', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'WEAPON5': '0.050', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.140', 'weapon7': '0.220', 'HITCOUNT': '0.300', 'ARMOR': '0.400', 'WEAPON3': '0.600', 'weapon3': '1.310', 'DAMAGECOUNT': '1.329', 'weapon2': '1.680', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:12,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11059.2, 300 sec: 11399.4). Total num frames: 5771264. Throughput: 0: 1473.1, 1: 1238.6. Samples: 1440775. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:12,460][109198] Avg episode reward: [(0, '-4.503'), (1, '-5.328')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:12,461][63454] Saving new best policy, reward=-4.503!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:14,752][63733] Updated weights for policy 1, policy_version 710 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:15,080][63735] DAMAGECOUNT value on done: 1691.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:15,080][63735] Sum rewards: -5.723, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.829', 'weapon5': '0.014', 'AMMO2': '0.023', 'AMMO5': '0.028', 'ARMOR': '0.036', 'WEAPON4': '0.050', 'weapon4': '0.054', 'AMMO4': '0.114', 'HITCOUNT': '0.150', 'AMMO3': '0.223', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.555', 'WEAPON3': '1.150', 'weapon2': '1.310', 'FRAGCOUNT': '2.000', 'weapon3': '2.050'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:15,513][63735] DAMAGECOUNT value on done: 1814.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:15,652][63806] DAMAGECOUNT value on done: 2154.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:16,027][63806] DAMAGECOUNT value on done: 1533.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:16,027][63806] Sum rewards: -3.309, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.096', 'AMMO2': '0.008', 'AMMO5': '0.010', 'AMMO4': '0.037', 'HITCOUNT': '0.070', 'ARMOR': '0.072', 'WEAPON5': '0.100', 'AMMO3': '0.111', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.303', 'weapon4': '0.620', 'WEAPON3': '0.700', 'weapon2': '0.942', 'FRAGCOUNT': '1.000', 'weapon3': '1.264'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:16,652][63734] DAMAGECOUNT value on done: 2682.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:16,653][63734] Sum rewards: 0.937, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.003', 'AMMO2': '0.009', 'weapon5': '0.010', 'WEAPON1': '0.010', 'AMMO4': '0.044', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'weapon4': '0.088', 'AMMO3': '0.115', 'HITCOUNT': '0.280', 'WEAPON3': '0.550', 'HEALTH': '0.598', 'DAMAGECOUNT': '0.975', 'FRAGCOUNT': '1.000', 'weapon2': '1.212', 'weapon3': '1.944'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:17,122][63734] DAMAGECOUNT value on done: 2081.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:17,458][109198] Fps is (10 sec: 11059.2, 60 sec: 10922.7, 300 sec: 11385.5). Total num frames: 5824512. Throughput: 0: 1433.1, 1: 1280.8. Samples: 1449087. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:17,460][109198] Avg episode reward: [(0, '-4.461'), (1, '-5.379')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:17,466][63454] Saving new best policy, reward=-4.461!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:17,762][63732] Updated weights for policy 0, policy_version 710 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:20,391][63769] DAMAGECOUNT value on done: 1891.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:20,644][63771] DAMAGECOUNT value on done: 1802.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:20,645][63771] Sum rewards: -2.647, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.407', 'AMMO5': '0.003', 'AMMO2': '0.034', 'WEAPON5': '0.050', 'weapon7': '0.058', 'AMMO3': '0.171', 'AMMO4': '0.172', 'weapon4': '0.182', 'HITCOUNT': '0.280', 'AMMO6': '0.300', 'WEAPON7': '0.300', 'AMMO7': '0.300', 'WEAPON4': '0.350', 'DAMAGECOUNT': '0.804', 'WEAPON3': '0.950', 'weapon2': '1.192', 'weapon3': '1.864', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:20,785][63769] DAMAGECOUNT value on done: 1983.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:20,785][63769] Sum rewards: -3.061, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.516', 'weapon4': '0.010', 'AMMO2': '0.015', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'ARMOR': '0.060', 'AMMO4': '0.074', 'weapon5': '0.076', 'WEAPON4': '0.100', 'HITCOUNT': '0.130', 'AMMO3': '0.151', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.750', 'weapon2': '1.646', 'weapon3': '1.738', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:20,988][63770] DAMAGECOUNT value on done: 2307.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:21,044][63771] DAMAGECOUNT value on done: 1928.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:21,044][63771] Sum rewards: -3.855, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.455', 'AMMO5': '0.003', 'AMMO2': '0.009', 'WEAPON1': '0.010', 'weapon5': '0.022', 'ARMOR': '0.024', 'AMMO4': '0.043', 'WEAPON5': '0.050', 'HITCOUNT': '0.080', 'AMMO3': '0.122', 'DAMAGECOUNT': '0.270', 'WEAPON3': '0.700', 'weapon2': '0.876', 'FRAGCOUNT': '1.000', 'weapon3': '1.642'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:21,389][63770] DAMAGECOUNT value on done: 1901.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:21,390][63770] Sum rewards: -6.911, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.030', 'AMMO4': '-0.039', 'AMMO2': '-0.008', 'ARMOR': '0.037', 'HITCOUNT': '0.090', 'AMMO3': '0.176', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.194', 'weapon3': '1.918'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:21,442][63769] DAMAGECOUNT value on done: 2346.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:21,805][63733] Updated weights for policy 1, policy_version 720 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:21,807][63806] DAMAGECOUNT value on done: 2563.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:21,807][63806] Sum rewards: 0.754, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.418', 'AMMO2': '0.011', 'AMMO4': '0.056', 'ARMOR': '0.076', 'AMMO3': '0.095', 'WEAPON4': '0.100', 'HITCOUNT': '0.170', 'weapon4': '0.206', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.795', 'FRAGCOUNT': '1.000', 'weapon2': '1.158', 'weapon3': '1.504'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:21,887][63769] DAMAGECOUNT value on done: 1550.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:21,887][63769] Sum rewards: -0.364, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.599', 'weapon5': '0.006', 'AMMO5': '0.007', 'AMMO2': '0.020', 'ARMOR': '0.044', 'WEAPON5': '0.050', 'weapon4': '0.052', 'AMMO3': '0.091', 'AMMO4': '0.097', 'WEAPON4': '0.200', 'HITCOUNT': '0.210', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.675', 'weapon2': '0.908', 'weapon3': '1.824', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:22,040][63735] DAMAGECOUNT value on done: 2767.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:22,041][63735] Sum rewards: -1.148, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.488', 'weapon5': '0.002', 'AMMO2': '0.004', 'AMMO5': '0.010', 'weapon4': '0.018', 'AMMO4': '0.019', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'WEAPON4': '0.050', 'AMMO3': '0.076', 'WEAPON5': '0.150', 'HITCOUNT': '0.250', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.945', 'weapon3': '1.380', 'weapon2': '1.480', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:22,151][63806] DAMAGECOUNT value on done: 2534.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:22,152][63806] Sum rewards: -9.042, reward structure: {'DEATHCOUNT': '-11.250', 'FRAGCOUNT': '-2.000', 'HEALTH': '-1.797', 'WEAPON1': '0.010', 'AMMO2': '0.012', 'AMMO5': '0.023', 'weapon4': '0.040', 'WEAPON4': '0.050', 'AMMO4': '0.058', 'HITCOUNT': '0.060', 'weapon5': '0.154', 'DAMAGECOUNT': '0.165', 'AMMO3': '0.198', 'ARMOR': '0.476', 'WEAPON5': '0.500', 'WEAPON3': '1.150', 'weapon2': '1.228', 'weapon3': '1.880'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:22,442][63735] DAMAGECOUNT value on done: 2615.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:22,443][63735] Sum rewards: 0.365, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.003', 'AMMO2': '0.011', 'AMMO4': '0.055', 'AMMO3': '0.088', 'ARMOR': '0.090', 'HEALTH': '0.090', 'WEAPON4': '0.150', 'HITCOUNT': '0.190', 'weapon4': '0.230', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.600', 'weapon2': '1.140', 'weapon3': '1.268', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:22,458][109198] Fps is (10 sec: 11468.9, 60 sec: 10990.9, 300 sec: 11413.3). Total num frames: 5885952. Throughput: 0: 1418.8, 1: 1356.4. Samples: 1465552. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:22,459][109198] Avg episode reward: [(0, '-4.443'), (1, '-5.212')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:22,461][63576] Saving new best policy, reward=-5.212!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:22,461][63454] Saving new best policy, reward=-4.443!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:23,841][63771] DAMAGECOUNT value on done: 2030.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:24,182][63771] DAMAGECOUNT value on done: 3063.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:24,182][63771] Sum rewards: -7.987, reward structure: {'DEATHCOUNT': '-12.000', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'AMMO2': '0.012', 'weapon5': '0.014', 'WEAPON4': '0.050', 'AMMO4': '0.060', 'ARMOR': '0.064', 'HITCOUNT': '0.070', 'WEAPON5': '0.100', 'weapon4': '0.104', 'HEALTH': '0.108', 'AMMO3': '0.158', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.750', 'weapon2': '1.282', 'weapon3': '1.436'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:25,532][63732] Updated weights for policy 0, policy_version 720 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:27,458][109198] Fps is (10 sec: 11468.7, 60 sec: 10922.7, 300 sec: 11385.5). Total num frames: 5939200. Throughput: 0: 1379.6, 1: 1418.7. Samples: 1482470. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:27,460][109198] Avg episode reward: [(0, '-4.443'), (1, '-5.244')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:28,644][63733] Updated weights for policy 1, policy_version 730 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:31,417][63767] DAMAGECOUNT value on done: 2538.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:31,418][63767] Sum rewards: -6.250, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.802', 'AMMO5': '0.005', 'AMMO2': '0.017', 'AMMO4': '0.084', 'ARMOR': '0.089', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.116', 'WEAPON4': '0.200', 'weapon4': '0.260', 'DAMAGECOUNT': '0.387', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.062', 'weapon2': '1.432'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:31,794][63767] DAMAGECOUNT value on done: 2205.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:31,795][63767] Sum rewards: -5.294, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.220', 'FRAGCOUNT': '-1.500', 'AMMO4': '-0.022', 'AMMO2': '-0.004', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'HITCOUNT': '0.040', 'WEAPON4': '0.050', 'weapon5': '0.068', 'DAMAGECOUNT': '0.102', 'weapon7': '0.122', 'AMMO3': '0.142', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.300', 'WEAPON3': '0.850', 'weapon2': '1.156', 'weapon3': '1.734'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:32,458][109198] Fps is (10 sec: 10649.5, 60 sec: 10990.9, 300 sec: 11385.5). Total num frames: 5992448. Throughput: 0: 1355.3, 1: 1443.5. Samples: 1490948. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:32,460][109198] Avg episode reward: [(0, '-4.443'), (1, '-5.244')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:32,605][63770] DAMAGECOUNT value on done: 1585.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:32,951][63767] DAMAGECOUNT value on done: 2902.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:32,951][63767] Sum rewards: -7.121, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.915', 'AMMO5': '0.005', 'AMMO2': '0.015', 'ARMOR': '0.040', 'AMMO4': '0.075', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'HITCOUNT': '0.140', 'AMMO3': '0.234', 'DAMAGECOUNT': '0.456', 'FRAGCOUNT': '1.000', 'weapon2': '1.076', 'WEAPON3': '1.250', 'weapon3': '2.302'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:32,987][63770] DAMAGECOUNT value on done: 2296.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:32,987][63770] Sum rewards: -2.554, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.310', 'AMMO2': '0.013', 'AMMO3': '0.062', 'AMMO4': '0.066', 'WEAPON4': '0.100', 'ARMOR': '0.121', 'HITCOUNT': '0.160', 'weapon4': '0.378', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.510', 'weapon3': '0.908', 'FRAGCOUNT': '1.000', 'weapon2': '1.038'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:33,258][63732] Updated weights for policy 0, policy_version 730 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:33,338][63767] DAMAGECOUNT value on done: 2772.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:33,338][63767] Sum rewards: 0.865, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.211', 'AMMO5': '0.008', 'AMMO2': '0.016', 'weapon4': '0.050', 'weapon5': '0.054', 'AMMO3': '0.080', 'AMMO4': '0.081', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'HITCOUNT': '0.310', 'WEAPON3': '0.350', 'weapon3': '1.236', 'DAMAGECOUNT': '1.269', 'weapon2': '1.822', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:33,777][63734] DAMAGECOUNT value on done: 1953.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:33,777][63734] Sum rewards: -8.828, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.156', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.007', 'weapon5': '0.010', 'AMMO2': '0.012', 'WEAPON1': '0.020', 'ARMOR': '0.044', 'AMMO4': '0.059', 'AMMO3': '0.125', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.531', 'WEAPON3': '0.650', 'weapon3': '1.358', 'weapon2': '1.722'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:34,126][63734] DAMAGECOUNT value on done: 2262.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:34,127][63734] Sum rewards: -2.527, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.016', 'AMMO2': '0.003', 'AMMO4': '0.016', 'WEAPON1': '0.020', 'ARMOR': '0.080', 'HITCOUNT': '0.120', 'AMMO3': '0.129', 'DAMAGECOUNT': '0.513', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.056', 'weapon3': '1.602'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:34,279][63805] DAMAGECOUNT value on done: 1831.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:34,591][63805] DAMAGECOUNT value on done: 2401.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:34,772][63805] DAMAGECOUNT value on done: 1865.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:34,772][63805] Sum rewards: -5.328, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.486', 'AMMO5': '0.015', 'AMMO2': '0.015', 'weapon5': '0.048', 'weapon7': '0.048', 'AMMO4': '0.076', 'HITCOUNT': '0.080', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'AMMO3': '0.197', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon4': '0.204', 'DAMAGECOUNT': '0.600', 'WEAPON3': '1.050', 'weapon2': '1.174', 'weapon3': '1.750', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:35,209][63805] DAMAGECOUNT value on done: 2733.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:35,209][63805] Sum rewards: -1.319, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.343', 'AMMO5': '0.003', 'weapon4': '0.004', 'AMMO2': '0.007', 'AMMO4': '0.035', 'WEAPON5': '0.050', 'weapon7': '0.058', 'ARMOR': '0.084', 'AMMO3': '0.091', 'WEAPON4': '0.100', 'HITCOUNT': '0.150', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.618', 'weapon2': '0.976', 'FRAGCOUNT': '1.000', 'weapon3': '1.498'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:35,486][63733] Updated weights for policy 1, policy_version 740 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:37,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11195.7, 300 sec: 11399.4). Total num frames: 6049792. Throughput: 0: 1332.2, 1: 1465.9. Samples: 1507795. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:37,460][109198] Avg episode reward: [(0, '-4.362'), (1, '-5.125')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:37,466][63454] Saving new best policy, reward=-4.362!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:37,466][63576] Saving new best policy, reward=-5.125!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:38,626][63806] DAMAGECOUNT value on done: 2318.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:38,626][63806] Sum rewards: -5.556, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.045', 'AMMO2': '0.004', 'weapon5': '0.008', 'AMMO4': '0.019', 'AMMO5': '0.020', 'AMMO3': '0.098', 'WEAPON4': '0.100', 'weapon4': '0.124', 'HITCOUNT': '0.140', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.492', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.314', 'weapon3': '1.320'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:39,019][63806] DAMAGECOUNT value on done: 1668.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:39,020][63806] Sum rewards: -4.915, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.700', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.007', 'AMMO2': '0.008', 'ARMOR': '0.020', 'weapon5': '0.024', 'AMMO4': '0.039', 'HITCOUNT': '0.080', 'AMMO3': '0.105', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.550', 'weapon3': '0.888', 'weapon2': '1.508'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:39,709][63735] DAMAGECOUNT value on done: 1735.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:40,032][63735] DAMAGECOUNT value on done: 2062.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:40,033][63735] Sum rewards: -8.941, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-0.735', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.008', 'AMMO5': '0.010', 'AMMO4': '0.042', 'WEAPON4': '0.050', 'weapon4': '0.050', 'weapon5': '0.054', 'ARMOR': '0.060', 'AMMO3': '0.114', 'HITCOUNT': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.744', 'weapon2': '1.116', 'weapon3': '1.696'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:40,805][63735] Large shaping reward -2.549 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.3, -100.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:41,101][63732] Updated weights for policy 0, policy_version 740 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:41,609][63734] DAMAGECOUNT value on done: 2785.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:42,095][63734] DAMAGECOUNT value on done: 2191.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:42,095][63734] Sum rewards: -4.871, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.412', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO4': '0.052', 'ARMOR': '0.056', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'weapon4': '0.114', 'AMMO3': '0.156', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.850', 'weapon2': '1.050', 'weapon3': '1.508', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:42,412][63733] Updated weights for policy 1, policy_version 750 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:42,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11264.0, 300 sec: 11385.5). Total num frames: 6107136. Throughput: 0: 1321.1, 1: 1478.5. Samples: 1524462. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:42,460][109198] Avg episode reward: [(0, '-4.465'), (1, '-5.036')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:42,461][63576] Saving new best policy, reward=-5.036!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:44,755][63735] DAMAGECOUNT value on done: 2847.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:44,755][63735] Sum rewards: -7.982, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.820', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'weapon5': '0.012', 'ARMOR': '0.033', 'AMMO2': '0.035', 'HITCOUNT': '0.070', 'AMMO3': '0.107', 'WEAPON5': '0.150', 'AMMO4': '0.172', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.240', 'weapon4': '0.384', 'WEAPON3': '0.450', 'weapon3': '0.582', 'weapon2': '1.636'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:45,035][63735] DAMAGECOUNT value on done: 2752.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:45,036][63735] Sum rewards: -7.168, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-3.005', 'AMMO5': '0.005', 'AMMO2': '0.013', 'WEAPON1': '0.020', 'AMMO4': '0.064', 'HITCOUNT': '0.080', 'WEAPON5': '0.100', 'AMMO3': '0.156', 'weapon4': '0.156', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.411', 'weapon2': '0.822', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon3': '1.610'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:45,586][63769] DAMAGECOUNT value on done: 1931.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:45,910][63771] DAMAGECOUNT value on done: 1882.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:45,910][63771] Sum rewards: -6.705, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.632', 'AMMO5': '0.003', 'ARMOR': '0.008', 'AMMO2': '0.012', 'weapon4': '0.012', 'WEAPON5': '0.050', 'AMMO4': '0.058', 'weapon7': '0.070', 'HITCOUNT': '0.080', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.148', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.240', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.424', 'weapon3': '1.682'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:46,029][63769] DAMAGECOUNT value on done: 2240.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:46,030][63769] Sum rewards: -7.246, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.218', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'ARMOR': '0.016', 'AMMO2': '0.020', 'weapon5': '0.034', 'AMMO4': '0.098', 'weapon4': '0.100', 'AMMO3': '0.146', 'HITCOUNT': '0.180', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.771', 'WEAPON3': '0.850', 'weapon3': '1.356', 'weapon2': '1.626'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:46,204][63806] DAMAGECOUNT value on done: 2752.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:46,255][63771] DAMAGECOUNT value on done: 2068.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:46,273][63770] DAMAGECOUNT value on done: 2657.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:46,273][63770] Sum rewards: 0.938, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.656', 'AMMO2': '0.010', 'AMMO5': '0.012', 'weapon5': '0.032', 'WEAPON4': '0.050', 'AMMO4': '0.051', 'ARMOR': '0.076', 'weapon4': '0.122', 'WEAPON5': '0.150', 'AMMO3': '0.160', 'HITCOUNT': '0.300', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.050', 'weapon2': '1.146', 'weapon3': '1.834', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:46,577][63806] DAMAGECOUNT value on done: 2989.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:46,577][63806] Sum rewards: -4.645, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-3.230', 'AMMO4': '-0.031', 'AMMO2': '-0.006', 'WEAPON1': '0.020', 'weapon5': '0.032', 'AMMO5': '0.033', 'AMMO3': '0.215', 'HITCOUNT': '0.350', 'ARMOR': '0.410', 'WEAPON5': '0.450', 'weapon2': '0.894', 'DAMAGECOUNT': '1.365', 'WEAPON3': '1.400', 'weapon3': '2.454', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:46,623][63769] DAMAGECOUNT value on done: 2910.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:46,623][63769] Sum rewards: 3.735, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.320', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO4': '0.026', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.103', 'weapon7': '0.270', 'HITCOUNT': '0.330', 'ARMOR': '0.448', 'WEAPON3': '0.550', 'weapon2': '1.482', 'weapon3': '1.594', 'DAMAGECOUNT': '1.692', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:46,680][63770] DAMAGECOUNT value on done: 1996.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:46,680][63770] Sum rewards: -3.046, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.760', 'AMMO5': '0.005', 'AMMO2': '0.005', 'weapon5': '0.008', 'weapon7': '0.026', 'AMMO4': '0.027', 'ARMOR': '0.060', 'WEAPON5': '0.100', 'weapon4': '0.104', 'AMMO3': '0.106', 'HITCOUNT': '0.120', 'WEAPON4': '0.150', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'DAMAGECOUNT': '0.285', 'WEAPON3': '0.650', 'weapon3': '0.974', 'FRAGCOUNT': '1.000', 'weapon2': '1.244'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:46,958][63769] DAMAGECOUNT value on done: 1615.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:46,959][63769] Sum rewards: -7.573, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.460', 'AMMO2': '0.001', 'AMMO5': '0.005', 'AMMO4': '0.006', 'WEAPON1': '0.020', 'weapon5': '0.028', 'WEAPON4': '0.050', 'weapon4': '0.064', 'HITCOUNT': '0.070', 'WEAPON5': '0.100', 'AMMO3': '0.158', 'DAMAGECOUNT': '0.195', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.184', 'weapon2': '1.506'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:47,300][63771] DAMAGECOUNT value on done: 2090.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:47,301][63771] Sum rewards: -6.474, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.180', 'AMMO5': '0.005', 'AMMO2': '0.014', 'weapon5': '0.018', 'ARMOR': '0.024', 'HITCOUNT': '0.060', 'AMMO4': '0.070', 'WEAPON5': '0.100', 'AMMO3': '0.165', 'DAMAGECOUNT': '0.180', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.264', 'weapon2': '1.506'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:47,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11195.7, 300 sec: 11399.4). Total num frames: 6164480. Throughput: 0: 1314.5, 1: 1481.3. Samples: 1532772. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:47,460][109198] Avg episode reward: [(0, '-4.339'), (1, '-5.070')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:47,467][63454] Saving new best policy, reward=-4.339!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:47,623][63771] DAMAGECOUNT value on done: 3088.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:47,624][63771] Sum rewards: -4.326, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.130', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'weapon5': '0.010', 'AMMO2': '0.019', 'HITCOUNT': '0.020', 'WEAPON5': '0.050', 'ARMOR': '0.072', 'DAMAGECOUNT': '0.075', 'AMMO4': '0.096', 'AMMO3': '0.135', 'WEAPON4': '0.200', 'weapon4': '0.224', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.146', 'weapon3': '1.244'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:48,942][63732] Updated weights for policy 0, policy_version 750 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:49,331][63733] Updated weights for policy 1, policy_version 760 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:52,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11195.7, 300 sec: 11371.6). Total num frames: 6217728. Throughput: 0: 1314.9, 1: 1476.9. Samples: 1549703. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:52,460][109198] Avg episode reward: [(0, '-4.339'), (1, '-5.098')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:53,751][63767] DAMAGECOUNT value on done: 3098.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:53,752][63767] Sum rewards: 1.111, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.220', 'weapon4': '0.010', 'AMMO5': '0.017', 'AMMO2': '0.023', 'AMMO3': '0.094', 'WEAPON4': '0.100', 'AMMO4': '0.113', 'weapon5': '0.248', 'HITCOUNT': '0.260', 'WEAPON5': '0.350', 'WEAPON3': '0.500', 'weapon3': '1.264', 'weapon2': '1.672', 'DAMAGECOUNT': '1.680', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:54,065][63767] DAMAGECOUNT value on done: 2455.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:54,065][63767] Sum rewards: -2.734, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.660', 'AMMO4': '-0.018', 'AMMO2': '-0.003', 'AMMO5': '0.010', 'ARMOR': '0.124', 'AMMO3': '0.139', 'WEAPON5': '0.200', 'HITCOUNT': '0.210', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.750', 'weapon2': '1.136', 'weapon3': '1.678', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:55,331][63767] DAMAGECOUNT value on done: 3007.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:55,332][63767] Sum rewards: -6.893, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.386', 'AMMO4': '-0.018', 'AMMO2': '-0.004', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'ARMOR': '0.056', 'HITCOUNT': '0.110', 'weapon5': '0.164', 'AMMO3': '0.200', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.315', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.432', 'weapon2': '1.900'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:55,657][63767] DAMAGECOUNT value on done: 3374.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:55,658][63767] Sum rewards: 0.375, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.476', 'AMMO4': '-0.038', 'AMMO2': '-0.008', 'ARMOR': '0.020', 'AMMO5': '0.022', 'weapon5': '0.066', 'AMMO3': '0.122', 'WEAPON5': '0.300', 'HITCOUNT': '0.340', 'WEAPON3': '0.700', 'weapon2': '1.418', 'DAMAGECOUNT': '1.806', 'weapon3': '1.852', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:56,305][63733] Updated weights for policy 1, policy_version 770 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:56,669][63732] Updated weights for policy 0, policy_version 760 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:57,033][63805] DAMAGECOUNT value on done: 2035.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:57,363][63734] DAMAGECOUNT value on done: 1968.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:57,387][63805] DAMAGECOUNT value on done: 2630.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:57,388][63805] Sum rewards: -4.904, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.357', 'AMMO2': '0.008', 'AMMO5': '0.013', 'AMMO4': '0.039', 'weapon5': '0.058', 'ARMOR': '0.068', 'AMMO3': '0.140', 'HITCOUNT': '0.170', 'WEAPON5': '0.300', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.687', 'WEAPON3': '0.850', 'weapon2': '1.480', 'weapon3': '1.890'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:57,458][109198] Fps is (10 sec: 10649.5, 60 sec: 11127.5, 300 sec: 11357.7). Total num frames: 6270976. Throughput: 0: 1313.3, 1: 1476.6. Samples: 1566318. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:45:57,460][109198] Avg episode reward: [(0, '-4.306'), (1, '-5.091')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:57,498][63454] Saving new best policy, reward=-4.306!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:57,758][63734] DAMAGECOUNT value on done: 2592.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:57,759][63734] Sum rewards: -3.949, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.010', 'ARMOR': '0.024', 'weapon5': '0.038', 'WEAPON4': '0.050', 'AMMO4': '0.050', 'AMMO3': '0.074', 'weapon4': '0.098', 'WEAPON5': '0.150', 'HITCOUNT': '0.220', 'HEALTH': '0.330', 'WEAPON3': '0.400', 'weapon3': '0.934', 'DAMAGECOUNT': '0.990', 'weapon2': '1.412'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:58,029][63770] DAMAGECOUNT value on done: 1705.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:58,030][63770] Sum rewards: 2.377, reward structure: {'DEATHCOUNT': '-1.500', 'HEALTH': '-0.431', 'AMMO4': '-0.034', 'AMMO2': '-0.007', 'HITCOUNT': '0.070', 'AMMO3': '0.076', 'WEAPON3': '0.250', 'DAMAGECOUNT': '0.360', 'ARMOR': '0.477', 'weapon2': '0.574', 'FRAGCOUNT': '1.000', 'weapon3': '1.542'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:58,495][63770] DAMAGECOUNT value on done: 2366.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:58,495][63770] Sum rewards: -1.133, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.717', 'AMMO2': '0.000', 'AMMO4': '0.001', 'weapon5': '0.008', 'AMMO5': '0.010', 'weapon4': '0.022', 'WEAPON4': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.093', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.210', 'WEAPON3': '0.400', 'ARMOR': '0.484', 'FRAGCOUNT': '1.000', 'weapon2': '1.114', 'weapon3': '1.282'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:59,636][63805] DAMAGECOUNT value on done: 2320.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:45:59,636][63805] Sum rewards: -5.170, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.706', 'AMMO4': '-0.020', 'AMMO2': '-0.004', 'AMMO5': '0.008', 'weapon5': '0.028', 'WEAPON1': '0.030', 'WEAPON5': '0.150', 'AMMO3': '0.191', 'HITCOUNT': '0.300', 'ARMOR': '0.472', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.332', 'DAMAGECOUNT': '1.365', 'weapon2': '1.934'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:00,046][63805] DAMAGECOUNT value on done: 3018.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:00,047][63805] Sum rewards: -1.503, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.368', 'AMMO2': '0.011', 'AMMO4': '0.055', 'AMMO3': '0.107', 'HITCOUNT': '0.260', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.855', 'weapon2': '0.900', 'weapon3': '2.226', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:01,727][63806] DAMAGECOUNT value on done: 2646.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:01,727][63806] Sum rewards: -0.276, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.793', 'AMMO2': '0.009', 'AMMO5': '0.010', 'AMMO4': '0.046', 'weapon7': '0.068', 'AMMO3': '0.092', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.124', 'HITCOUNT': '0.220', 'WEAPON3': '0.450', 'ARMOR': '0.536', 'DAMAGECOUNT': '0.984', 'weapon2': '1.082', 'weapon3': '1.146', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:02,008][63805] Large shaping reward 2.632 for [('FRAGCOUNT', 2.0, 2.0), ('HITCOUNT', 0.03, 3.0), ('DAMAGECOUNT', 0.6, 200), ('weapon7', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:02,115][63806] DAMAGECOUNT value on done: 1703.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:02,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11127.5, 300 sec: 11357.7). Total num frames: 6328320. Throughput: 0: 1312.2, 1: 1478.2. Samples: 1574652. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:02,460][109198] Avg episode reward: [(0, '-4.244'), (1, '-4.868')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:02,461][63454] Saving new best policy, reward=-4.244!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:02,461][63576] Saving new best policy, reward=-4.868!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:03,347][63733] Updated weights for policy 1, policy_version 780 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:04,356][63735] DAMAGECOUNT value on done: 1939.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:04,357][63735] Sum rewards: -3.711, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.897', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'WEAPON1': '0.010', 'AMMO5': '0.025', 'ARMOR': '0.048', 'weapon5': '0.110', 'HITCOUNT': '0.170', 'AMMO3': '0.175', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.612', 'WEAPON3': '0.900', 'weapon2': '1.292', 'weapon3': '1.702', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:04,576][63732] Updated weights for policy 0, policy_version 770 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:04,780][63735] DAMAGECOUNT value on done: 2110.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:04,780][63735] Sum rewards: 0.499, reward structure: {'DEATHCOUNT': '-3.750', 'HEALTH': '-0.386', 'AMMO2': '0.017', 'HITCOUNT': '0.040', 'AMMO3': '0.079', 'AMMO4': '0.085', 'ARMOR': '0.112', 'DAMAGECOUNT': '0.144', 'WEAPON4': '0.150', 'WEAPON3': '0.400', 'weapon4': '0.498', 'weapon3': '0.768', 'FRAGCOUNT': '1.000', 'weapon2': '1.342'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:07,113][63734] DAMAGECOUNT value on done: 2955.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:07,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11127.5, 300 sec: 11343.8). Total num frames: 6381568. Throughput: 0: 1313.9, 1: 1480.2. Samples: 1591289. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:07,460][109198] Avg episode reward: [(0, '-4.225'), (1, '-4.761')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:07,466][63454] Saving new best policy, reward=-4.225!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:07,480][63576] Saving new best policy, reward=-4.761!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:07,560][63734] DAMAGECOUNT value on done: 2218.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:07,707][63735] DAMAGECOUNT value on done: 2862.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:07,708][63735] Sum rewards: -7.377, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-0.150', 'AMMO5': '0.005', 'AMMO2': '0.007', 'HITCOUNT': '0.020', 'weapon4': '0.024', 'AMMO4': '0.033', 'DAMAGECOUNT': '0.045', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'AMMO3': '0.153', 'WEAPON3': '0.700', 'ARMOR': '0.812', 'weapon3': '0.998', 'FRAGCOUNT': '1.000', 'weapon2': '1.576'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:08,044][63735] DAMAGECOUNT value on done: 2772.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:10,301][63733] Updated weights for policy 1, policy_version 790 (0.0009)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:10,720][63806] DAMAGECOUNT value on done: 2764.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:10,735][63771] DAMAGECOUNT value on done: 2160.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:10,736][63771] Sum rewards: -4.433, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.126', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'AMMO4': '0.021', 'HITCOUNT': '0.060', 'ARMOR': '0.100', 'AMMO3': '0.143', 'DAMAGECOUNT': '0.210', 'WEAPON3': '0.800', 'weapon2': '0.924', 'weapon3': '1.920', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:11,087][63769] DAMAGECOUNT value on done: 2056.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:11,088][63769] Sum rewards: -6.382, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.936', 'AMMO2': '0.010', 'WEAPON1': '0.010', 'AMMO4': '0.049', 'HITCOUNT': '0.070', 'WEAPON4': '0.100', 'weapon4': '0.148', 'AMMO3': '0.172', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.272', 'weapon3': '1.648'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:11,095][63771] DAMAGECOUNT value on done: 2133.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:11,096][63771] Sum rewards: -8.785, reward structure: {'DEATHCOUNT': '-12.750', 'FRAGCOUNT': '-2.000', 'HEALTH': '-0.328', 'AMMO2': '0.008', 'AMMO5': '0.017', 'AMMO4': '0.038', 'weapon5': '0.098', 'HITCOUNT': '0.150', 'AMMO3': '0.167', 'WEAPON5': '0.250', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.753', 'ARMOR': '0.800', 'weapon2': '1.670', 'weapon3': '1.692'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:11,169][63771] DAMAGECOUNT value on done: 3303.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:11,170][63771] Sum rewards: -5.427, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.685', 'AMMO2': '0.002', 'weapon5': '0.002', 'AMMO5': '0.005', 'AMMO4': '0.009', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'weapon4': '0.126', 'AMMO3': '0.161', 'HITCOUNT': '0.190', 'ARMOR': '0.432', 'DAMAGECOUNT': '0.645', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.068', 'weapon3': '1.418'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:11,182][63806] DAMAGECOUNT value on done: 3199.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:11,182][63806] Sum rewards: -5.983, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.609', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.020', 'AMMO2': '0.029', 'weapon5': '0.040', 'weapon4': '0.042', 'WEAPON4': '0.100', 'AMMO4': '0.144', 'AMMO3': '0.168', 'HITCOUNT': '0.180', 'WEAPON5': '0.250', 'ARMOR': '0.547', 'DAMAGECOUNT': '0.630', 'WEAPON3': '0.900', 'weapon2': '1.460', 'weapon3': '1.866'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:11,454][63769] DAMAGECOUNT value on done: 2410.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:11,454][63769] Sum rewards: -2.315, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.692', 'AMMO2': '0.012', 'weapon4': '0.018', 'weapon5': '0.034', 'AMMO5': '0.035', 'ARMOR': '0.042', 'AMMO4': '0.059', 'HITCOUNT': '0.150', 'AMMO3': '0.163', 'WEAPON4': '0.200', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.152', 'weapon3': '2.202'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:11,490][63771] DAMAGECOUNT value on done: 2153.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:11,889][63770] DAMAGECOUNT value on done: 2955.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:11,890][63770] Sum rewards: -2.897, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.750', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.011', 'WEAPON1': '0.020', 'AMMO5': '0.022', 'ARMOR': '0.035', 'weapon5': '0.038', 'AMMO4': '0.052', 'AMMO3': '0.119', 'HITCOUNT': '0.270', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.894', 'weapon2': '1.194', 'weapon3': '1.998'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:12,105][63769] DAMAGECOUNT value on done: 3040.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:12,250][63770] DAMAGECOUNT value on done: 2086.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:12,251][63770] Sum rewards: -0.213, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.124', 'AMMO2': '0.002', 'AMMO5': '0.005', 'AMMO4': '0.011', 'ARMOR': '0.044', 'AMMO3': '0.085', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.270', 'WEAPON3': '0.450', 'weapon2': '1.304', 'weapon3': '1.540', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:12,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11127.4, 300 sec: 11343.8). Total num frames: 6438912. Throughput: 0: 1308.4, 1: 1477.2. Samples: 1607823. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:12,460][109198] Avg episode reward: [(0, '-4.181'), (1, '-4.826')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:12,463][63454] Saving new best policy, reward=-4.181!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:12,465][63732] Updated weights for policy 0, policy_version 780 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:12,541][63769] DAMAGECOUNT value on done: 1781.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:12,541][63769] Sum rewards: -3.008, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.876', 'AMMO2': '0.019', 'weapon4': '0.020', 'ARMOR': '0.032', 'AMMO4': '0.095', 'WEAPON4': '0.100', 'AMMO3': '0.105', 'HITCOUNT': '0.130', 'DAMAGECOUNT': '0.498', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.014', 'weapon3': '1.704'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:16,269][63767] DAMAGECOUNT value on done: 3350.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:16,270][63767] Sum rewards: -4.001, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.800', 'weapon5': '0.006', 'AMMO5': '0.007', 'AMMO2': '0.038', 'AMMO3': '0.078', 'WEAPON5': '0.100', 'ARMOR': '0.129', 'HITCOUNT': '0.160', 'weapon4': '0.176', 'AMMO4': '0.188', 'WEAPON3': '0.500', 'WEAPON4': '0.500', 'DAMAGECOUNT': '0.756', 'weapon3': '0.940', 'FRAGCOUNT': '1.000', 'weapon2': '1.470'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:16,621][63767] DAMAGECOUNT value on done: 2881.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:16,622][63767] Sum rewards: -0.259, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.745', 'AMMO2': '0.018', 'AMMO5': '0.019', 'weapon5': '0.042', 'AMMO4': '0.088', 'weapon4': '0.094', 'AMMO3': '0.154', 'WEAPON4': '0.200', 'HITCOUNT': '0.310', 'WEAPON5': '0.400', 'WEAPON3': '0.850', 'weapon2': '1.100', 'DAMAGECOUNT': '1.278', 'weapon3': '2.182', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:17,252][63733] Updated weights for policy 1, policy_version 800 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:17,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11195.7, 300 sec: 11343.8). Total num frames: 6496256. Throughput: 0: 1307.7, 1: 1475.3. Samples: 1616183. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:17,460][109198] Avg episode reward: [(0, '-4.119'), (1, '-4.809')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:17,466][63454] Saving new best policy, reward=-4.119!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:17,862][63767] DAMAGECOUNT value on done: 3380.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:17,862][63767] Sum rewards: -1.411, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.610', 'ARMOR': '0.008', 'AMMO2': '0.010', 'AMMO5': '0.010', 'AMMO4': '0.048', 'AMMO3': '0.082', 'weapon5': '0.094', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'HITCOUNT': '0.180', 'weapon4': '0.230', 'WEAPON3': '0.500', 'weapon3': '0.984', 'DAMAGECOUNT': '1.119', 'weapon2': '1.884', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:18,218][63767] DAMAGECOUNT value on done: 3504.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:18,219][63767] Sum rewards: -2.843, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.900', 'AMMO5': '0.012', 'AMMO2': '0.021', 'weapon5': '0.048', 'AMMO3': '0.084', 'HITCOUNT': '0.100', 'AMMO4': '0.103', 'weapon4': '0.104', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.162', 'weapon3': '1.782'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:19,963][63805] DAMAGECOUNT value on done: 2409.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:19,964][63805] Sum rewards: -5.202, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.000', 'HEALTH': '-0.642', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'AMMO5': '0.013', 'weapon4': '0.042', 'WEAPON4': '0.050', 'AMMO4': '0.053', 'AMMO3': '0.093', 'HITCOUNT': '0.160', 'weapon5': '0.174', 'WEAPON5': '0.200', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.122', 'weapon2': '1.316', 'weapon3': '1.546'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:20,258][63732] Updated weights for policy 0, policy_version 790 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:20,356][63805] DAMAGECOUNT value on done: 2950.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:20,356][63805] Sum rewards: 0.160, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.488', 'AMMO5': '0.005', 'weapon5': '0.016', 'AMMO2': '0.018', 'WEAPON5': '0.050', 'weapon7': '0.060', 'AMMO4': '0.091', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'ARMOR': '0.108', 'HITCOUNT': '0.120', 'AMMO3': '0.126', 'WEAPON4': '0.200', 'weapon4': '0.312', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.945', 'weapon3': '1.100', 'weapon2': '1.296', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:20,950][63734] DAMAGECOUNT value on done: 2031.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:21,294][63734] DAMAGECOUNT value on done: 2601.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:22,458][109198] Fps is (10 sec: 11059.4, 60 sec: 11059.2, 300 sec: 11316.1). Total num frames: 6549504. Throughput: 0: 1306.9, 1: 1471.6. Samples: 1632826. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:22,459][109198] Avg episode reward: [(0, '-3.983'), (1, '-4.816')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:22,461][63454] Saving new best policy, reward=-3.983!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:23,774][63770] DAMAGECOUNT value on done: 1817.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:23,775][63770] Sum rewards: -2.323, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.696', 'ARMOR': '0.008', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.023', 'HITCOUNT': '0.050', 'weapon5': '0.082', 'AMMO4': '0.115', 'weapon4': '0.126', 'AMMO3': '0.140', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.336', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.320', 'weapon3': '1.602'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:24,124][63770] DAMAGECOUNT value on done: 2441.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:24,315][63733] Updated weights for policy 1, policy_version 810 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:24,482][63806] DAMAGECOUNT value on done: 2721.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:24,483][63806] Sum rewards: -4.631, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.460', 'AMMO5': '0.005', 'AMMO2': '0.008', 'weapon5': '0.018', 'AMMO4': '0.039', 'ARMOR': '0.044', 'HITCOUNT': '0.060', 'weapon4': '0.068', 'AMMO3': '0.076', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.225', 'WEAPON3': '0.400', 'weapon3': '0.674', 'weapon2': '1.762', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:24,676][63805] DAMAGECOUNT value on done: 2535.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:24,823][63806] DAMAGECOUNT value on done: 1828.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:25,155][63805] DAMAGECOUNT value on done: 3083.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:25,155][63805] Sum rewards: -1.366, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.760', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'AMMO5': '0.005', 'WEAPON4': '0.050', 'HITCOUNT': '0.050', 'weapon4': '0.094', 'ARMOR': '0.096', 'WEAPON5': '0.100', 'AMMO3': '0.120', 'DAMAGECOUNT': '0.195', 'WEAPON3': '0.800', 'weapon2': '1.114', 'weapon3': '1.528', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:27,459][109198] Fps is (10 sec: 10649.0, 60 sec: 11059.1, 300 sec: 11316.0). Total num frames: 6602752. Throughput: 0: 1301.9, 1: 1466.6. Samples: 1649044. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:27,460][109198] Avg episode reward: [(0, '-3.942'), (1, '-4.695')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:27,468][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000814_3334144.pth...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:27,495][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000799_3272704.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:27,524][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000505_2068480.pth\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:27,532][63576] Saving new best policy, reward=-4.695!\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:27,567][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000447_1830912.pth\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:27,576][63454] Saving new best policy, reward=-3.942!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:28,310][63732] Updated weights for policy 0, policy_version 800 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:29,451][63735] DAMAGECOUNT value on done: 2197.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:29,451][63735] Sum rewards: -2.832, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.468', 'AMMO5': '0.003', 'weapon5': '0.006', 'WEAPON1': '0.010', 'AMMO2': '0.020', 'WEAPON5': '0.050', 'ARMOR': '0.092', 'AMMO4': '0.099', 'AMMO3': '0.131', 'WEAPON4': '0.150', 'HITCOUNT': '0.180', 'weapon4': '0.206', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.774', 'weapon3': '0.996', 'weapon2': '1.320', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:29,846][63735] DAMAGECOUNT value on done: 2220.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:29,847][63735] Sum rewards: -4.449, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.010', 'AMMO5': '0.010', 'weapon5': '0.010', 'AMMO2': '0.011', 'AMMO4': '0.052', 'weapon4': '0.064', 'WEAPON5': '0.100', 'HITCOUNT': '0.100', 'AMMO3': '0.128', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.082', 'weapon2': '1.324'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:30,959][63735] DAMAGECOUNT value on done: 3104.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:30,960][63735] Sum rewards: -1.408, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.724', 'WEAPON1': '0.010', 'AMMO2': '0.019', 'AMMO4': '0.092', 'AMMO3': '0.121', 'HITCOUNT': '0.210', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.726', 'weapon3': '1.336', 'weapon2': '1.602', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:31,186][63733] Updated weights for policy 1, policy_version 820 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:31,382][63735] DAMAGECOUNT value on done: 2895.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:31,382][63735] Sum rewards: -4.250, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.412', 'AMMO4': '-0.010', 'AMMO2': '-0.002', 'AMMO5': '0.003', 'weapon5': '0.012', 'WEAPON5': '0.050', 'HITCOUNT': '0.110', 'ARMOR': '0.112', 'AMMO3': '0.158', 'DAMAGECOUNT': '0.369', 'WEAPON3': '0.900', 'weapon2': '0.996', 'FRAGCOUNT': '1.000', 'weapon3': '1.714'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:32,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11127.5, 300 sec: 11316.1). Total num frames: 6660096. Throughput: 0: 1303.0, 1: 1470.5. Samples: 1657581. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:32,460][109198] Avg episode reward: [(0, '-3.946'), (1, '-4.588')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:32,461][63576] Saving new best policy, reward=-4.588!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:32,503][63734] DAMAGECOUNT value on done: 3209.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:32,503][63734] Sum rewards: -6.547, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.488', 'AMMO5': '0.012', 'AMMO2': '0.020', 'weapon5': '0.080', 'AMMO4': '0.099', 'weapon4': '0.134', 'AMMO3': '0.146', 'WEAPON4': '0.150', 'HITCOUNT': '0.200', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.762', 'WEAPON3': '0.850', 'weapon2': '1.440', 'weapon3': '1.548', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:32,930][63734] DAMAGECOUNT value on done: 2218.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:34,095][63771] DAMAGECOUNT value on done: 2235.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:34,095][63771] Sum rewards: -5.857, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.647', 'AMMO2': '0.016', 'ARMOR': '0.024', 'HITCOUNT': '0.070', 'weapon4': '0.078', 'AMMO4': '0.082', 'WEAPON4': '0.150', 'AMMO3': '0.153', 'DAMAGECOUNT': '0.225', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.122', 'weapon3': '1.670'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:34,474][63771] DAMAGECOUNT value on done: 3328.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:35,460][63806] DAMAGECOUNT value on done: 3024.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:35,460][63806] Sum rewards: -1.744, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.310', 'AMMO2': '0.003', 'AMMO5': '0.010', 'weapon4': '0.014', 'AMMO4': '0.017', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.142', 'HITCOUNT': '0.180', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.780', 'weapon2': '1.268', 'weapon3': '1.502', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:35,823][63806] DAMAGECOUNT value on done: 3239.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:36,000][63732] Updated weights for policy 0, policy_version 810 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:36,146][63771] DAMAGECOUNT value on done: 2334.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:36,146][63771] Sum rewards: -1.687, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO2': '0.007', 'AMMO5': '0.009', 'weapon5': '0.022', 'AMMO4': '0.036', 'ARMOR': '0.048', 'WEAPON4': '0.050', 'AMMO3': '0.117', 'HITCOUNT': '0.140', 'weapon4': '0.170', 'WEAPON5': '0.200', 'HEALTH': '0.280', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.603', 'FRAGCOUNT': '1.000', 'weapon2': '1.218', 'weapon3': '1.362'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:36,447][63771] DAMAGECOUNT value on done: 2218.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:36,670][63769] DAMAGECOUNT value on done: 2141.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:36,670][63769] Sum rewards: -7.430, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.629', 'weapon5': '0.002', 'AMMO5': '0.003', 'AMMO2': '0.016', 'weapon4': '0.020', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'HITCOUNT': '0.070', 'AMMO4': '0.080', 'WEAPON4': '0.100', 'AMMO3': '0.179', 'DAMAGECOUNT': '0.255', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.390', 'weapon2': '1.444'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:37,124][63769] DAMAGECOUNT value on done: 2623.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:37,125][63769] Sum rewards: -4.854, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.068', 'AMMO2': '0.022', 'ARMOR': '0.044', 'AMMO4': '0.108', 'AMMO3': '0.115', 'weapon4': '0.146', 'HITCOUNT': '0.180', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.639', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.130', 'weapon2': '1.830'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:37,458][109198] Fps is (10 sec: 11059.8, 60 sec: 11059.2, 300 sec: 11302.2). Total num frames: 6713344. Throughput: 0: 1299.7, 1: 1467.9. Samples: 1674244. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:37,460][109198] Avg episode reward: [(0, '-3.928'), (1, '-4.608')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:37,468][63454] Saving new best policy, reward=-3.928!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:37,718][63770] DAMAGECOUNT value on done: 3035.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:37,719][63770] Sum rewards: -1.988, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.295', 'AMMO5': '0.007', 'AMMO2': '0.030', 'weapon7': '0.058', 'weapon4': '0.078', 'HITCOUNT': '0.080', 'AMMO3': '0.096', 'WEAPON5': '0.100', 'AMMO4': '0.148', 'DAMAGECOUNT': '0.240', 'WEAPON4': '0.250', 'AMMO6': '0.260', 'AMMO7': '0.260', 'WEAPON7': '0.300', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon2': '1.146', 'weapon3': '2.004'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:37,812][63769] DAMAGECOUNT value on done: 3443.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:37,813][63769] Sum rewards: 1.461, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.905', 'AMMO5': '0.009', 'ARMOR': '0.016', 'AMMO2': '0.030', 'AMMO3': '0.070', 'weapon5': '0.142', 'AMMO4': '0.147', 'WEAPON4': '0.150', 'weapon4': '0.160', 'WEAPON5': '0.200', 'HITCOUNT': '0.250', 'WEAPON3': '0.400', 'weapon3': '0.890', 'DAMAGECOUNT': '1.209', 'weapon2': '1.692', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:38,077][63770] DAMAGECOUNT value on done: 2186.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:38,077][63770] Sum rewards: -4.205, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.344', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'AMMO5': '0.005', 'ARMOR': '0.028', 'HITCOUNT': '0.070', 'WEAPON5': '0.100', 'AMMO3': '0.135', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.298', 'weapon3': '1.666'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:38,187][63733] Updated weights for policy 1, policy_version 830 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:38,220][63769] DAMAGECOUNT value on done: 1811.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:38,999][63767] DAMAGECOUNT value on done: 3681.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:39,000][63767] Sum rewards: -6.860, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.216', 'AMMO5': '0.007', 'AMMO2': '0.028', 'weapon5': '0.050', 'ARMOR': '0.064', 'AMMO4': '0.141', 'AMMO3': '0.148', 'WEAPON5': '0.200', 'weapon4': '0.202', 'HITCOUNT': '0.290', 'WEAPON4': '0.400', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.993', 'weapon3': '1.318', 'weapon2': '1.464'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:39,382][63767] DAMAGECOUNT value on done: 3070.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:39,383][63767] Sum rewards: -1.774, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.578', 'weapon5': '0.006', 'AMMO2': '0.009', 'WEAPON1': '0.010', 'AMMO5': '0.013', 'AMMO4': '0.042', 'weapon4': '0.046', 'WEAPON4': '0.050', 'ARMOR': '0.076', 'AMMO3': '0.109', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.567', 'WEAPON3': '0.750', 'weapon3': '1.416', 'weapon2': '1.600', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:40,569][63767] DAMAGECOUNT value on done: 3615.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:40,569][63767] Sum rewards: 0.275, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.391', 'ARMOR': '0.004', 'AMMO2': '0.022', 'AMMO5': '0.033', 'AMMO3': '0.108', 'AMMO4': '0.110', 'weapon5': '0.152', 'HITCOUNT': '0.160', 'weapon4': '0.166', 'WEAPON4': '0.250', 'WEAPON5': '0.450', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.705', 'weapon2': '0.872', 'weapon3': '1.734', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:40,954][63767] DAMAGECOUNT value on done: 3709.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:40,954][63767] Sum rewards: -2.623, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.751', 'AMMO5': '0.013', 'ARMOR': '0.016', 'weapon5': '0.028', 'AMMO2': '0.029', 'AMMO3': '0.113', 'AMMO4': '0.144', 'weapon4': '0.156', 'HITCOUNT': '0.160', 'WEAPON5': '0.250', 'WEAPON4': '0.350', 'DAMAGECOUNT': '0.615', 'WEAPON3': '0.700', 'weapon3': '1.260', 'weapon2': '1.544', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:42,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11059.2, 300 sec: 11302.2). Total num frames: 6770688. Throughput: 0: 1299.8, 1: 1465.8. Samples: 1690767. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:42,460][109198] Avg episode reward: [(0, '-3.659'), (1, '-4.592')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:42,461][63454] Saving new best policy, reward=-3.659!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:42,984][63805] DAMAGECOUNT value on done: 2707.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:42,984][63805] Sum rewards: -6.710, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.734', 'ARMOR': '0.004', 'weapon5': '0.014', 'AMMO5': '0.028', 'AMMO2': '0.030', 'AMMO3': '0.148', 'AMMO4': '0.149', 'weapon4': '0.220', 'HITCOUNT': '0.250', 'WEAPON4': '0.300', 'WEAPON5': '0.450', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.894', 'FRAGCOUNT': '1.000', 'weapon2': '1.210', 'weapon3': '1.478'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:43,352][63805] DAMAGECOUNT value on done: 3187.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:43,353][63805] Sum rewards: 0.943, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.484', 'AMMO5': '0.005', 'weapon5': '0.022', 'AMMO2': '0.029', 'AMMO3': '0.081', 'WEAPON5': '0.100', 'AMMO4': '0.147', 'weapon4': '0.166', 'HITCOUNT': '0.180', 'WEAPON4': '0.250', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.711', 'weapon2': '1.444', 'weapon3': '1.592', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:43,860][63732] Updated weights for policy 0, policy_version 820 (0.0009)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:44,823][63734] DAMAGECOUNT value on done: 2090.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:44,824][63734] Sum rewards: -2.451, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.520', 'AMMO2': '0.013', 'AMMO4': '0.065', 'HITCOUNT': '0.070', 'AMMO3': '0.072', 'WEAPON4': '0.100', 'ARMOR': '0.131', 'DAMAGECOUNT': '0.177', 'weapon4': '0.396', 'WEAPON3': '0.450', 'weapon2': '0.974', 'FRAGCOUNT': '1.000', 'weapon3': '1.370'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:45,184][63733] Updated weights for policy 1, policy_version 840 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:45,219][63734] DAMAGECOUNT value on done: 2726.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:45,220][63734] Sum rewards: -5.562, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.006', 'AMMO5': '0.003', 'weapon5': '0.008', 'AMMO2': '0.014', 'WEAPON5': '0.050', 'AMMO4': '0.069', 'HITCOUNT': '0.080', 'weapon4': '0.094', 'WEAPON4': '0.100', 'AMMO3': '0.104', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.266', 'weapon2': '1.432'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:47,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11059.2, 300 sec: 11302.2). Total num frames: 6828032. Throughput: 0: 1303.5, 1: 1465.7. Samples: 1699263. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:47,459][109198] Avg episode reward: [(0, '-3.619'), (1, '-4.583')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:47,465][63576] Saving new best policy, reward=-4.583!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:47,465][63454] Saving new best policy, reward=-3.619!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:47,721][63806] DAMAGECOUNT value on done: 2971.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:47,722][63806] Sum rewards: -6.022, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.188', 'AMMO5': '0.010', 'AMMO2': '0.016', 'ARMOR': '0.044', 'AMMO4': '0.077', 'AMMO3': '0.179', 'weapon4': '0.188', 'HITCOUNT': '0.190', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.750', 'WEAPON3': '0.950', 'weapon2': '1.098', 'weapon3': '1.514', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:48,116][63806] DAMAGECOUNT value on done: 1843.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:48,116][63806] Sum rewards: -10.509, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-2.387', 'AMMO5': '0.005', 'AMMO2': '0.005', 'WEAPON1': '0.010', 'ARMOR': '0.016', 'HITCOUNT': '0.020', 'AMMO4': '0.026', 'weapon4': '0.030', 'DAMAGECOUNT': '0.045', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.162', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.196', 'weapon2': '1.862'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:49,447][63770] DAMAGECOUNT value on done: 1952.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:49,447][63770] Sum rewards: -6.017, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.992', 'AMMO2': '0.012', 'AMMO5': '0.022', 'weapon5': '0.028', 'AMMO4': '0.061', 'HITCOUNT': '0.110', 'AMMO3': '0.123', 'WEAPON4': '0.200', 'weapon4': '0.266', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.405', 'ARMOR': '0.448', 'WEAPON3': '0.750', 'weapon2': '1.152', 'weapon3': '1.548'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:49,589][63805] DAMAGECOUNT value on done: 2855.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:49,589][63805] Sum rewards: -1.030, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.204', 'weapon4': '0.002', 'AMMO2': '0.002', 'AMMO4': '0.011', 'AMMO5': '0.017', 'ARMOR': '0.040', 'weapon5': '0.056', 'AMMO3': '0.087', 'WEAPON4': '0.100', 'WEAPON5': '0.250', 'HITCOUNT': '0.250', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.960', 'weapon3': '1.260', 'weapon2': '1.938', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:49,790][63770] DAMAGECOUNT value on done: 2511.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:49,791][63770] Sum rewards: -2.923, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.510', 'AMMO2': '0.006', 'AMMO4': '0.031', 'ARMOR': '0.040', 'HITCOUNT': '0.070', 'weapon4': '0.082', 'WEAPON4': '0.100', 'AMMO3': '0.108', 'DAMAGECOUNT': '0.210', 'WEAPON3': '0.700', 'weapon2': '0.948', 'FRAGCOUNT': '1.000', 'weapon3': '1.792'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:49,954][63805] DAMAGECOUNT value on done: 3098.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:51,783][63732] Updated weights for policy 0, policy_version 830 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:52,143][63733] Updated weights for policy 1, policy_version 850 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:52,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11127.5, 300 sec: 11288.3). Total num frames: 6885376. Throughput: 0: 1302.7, 1: 1466.7. Samples: 1715910. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:52,461][109198] Avg episode reward: [(0, '-3.636'), (1, '-4.616')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:53,815][63735] DAMAGECOUNT value on done: 3319.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:53,816][63735] Sum rewards: -3.131, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.760', 'AMMO2': '0.002', 'AMMO4': '0.007', 'WEAPON4': '0.050', 'ARMOR': '0.088', 'AMMO3': '0.127', 'weapon4': '0.156', 'HITCOUNT': '0.160', 'DAMAGECOUNT': '0.645', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.318', 'weapon3': '1.626'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:54,144][63735] DAMAGECOUNT value on done: 2502.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:54,145][63735] Sum rewards: -3.014, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.049', 'AMMO2': '0.021', 'AMMO5': '0.037', 'weapon5': '0.058', 'AMMO4': '0.104', 'AMMO3': '0.142', 'WEAPON4': '0.200', 'weapon4': '0.200', 'HITCOUNT': '0.240', 'WEAPON5': '0.550', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.915', 'weapon2': '1.220', 'weapon3': '1.548', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:54,198][63735] DAMAGECOUNT value on done: 3137.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:54,199][63735] Sum rewards: -2.967, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.460', 'AMMO2': '0.011', 'weapon4': '0.022', 'ARMOR': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.057', 'AMMO3': '0.111', 'HITCOUNT': '0.240', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.726', 'FRAGCOUNT': '1.000', 'weapon2': '1.318', 'weapon3': '1.708'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:54,523][63735] DAMAGECOUNT value on done: 2310.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:54,523][63735] Sum rewards: -4.228, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.400', 'AMMO2': '0.016', 'ARMOR': '0.040', 'HITCOUNT': '0.080', 'AMMO4': '0.081', 'AMMO3': '0.106', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.270', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.144', 'weapon3': '1.634'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:56,858][63771] DAMAGECOUNT value on done: 2264.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:57,211][63771] DAMAGECOUNT value on done: 3593.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:57,211][63771] Sum rewards: -7.907, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-3.060', 'AMMO4': '-0.045', 'AMMO2': '-0.009', 'AMMO5': '0.005', 'weapon5': '0.006', 'ARMOR': '0.044', 'WEAPON5': '0.100', 'AMMO3': '0.144', 'HITCOUNT': '0.220', 'DAMAGECOUNT': '0.795', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.306', 'weapon3': '1.886'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:57,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11127.5, 300 sec: 11274.4). Total num frames: 6938624. Throughput: 0: 1306.9, 1: 1473.1. Samples: 1732920. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:46:57,460][109198] Avg episode reward: [(0, '-3.669'), (1, '-4.559')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:57,466][63576] Saving new best policy, reward=-4.559!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:57,953][63734] DAMAGECOUNT value on done: 3411.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:58,361][63734] DAMAGECOUNT value on done: 2278.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:58,362][63734] Sum rewards: -4.476, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.180', 'AMMO2': '0.004', 'AMMO4': '0.018', 'ARMOR': '0.048', 'HITCOUNT': '0.060', 'weapon4': '0.060', 'WEAPON4': '0.100', 'AMMO3': '0.168', 'DAMAGECOUNT': '0.180', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.248', 'weapon3': '1.918'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:58,969][63733] Updated weights for policy 1, policy_version 860 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:46:59,426][63732] Updated weights for policy 0, policy_version 840 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:00,512][63806] DAMAGECOUNT value on done: 3240.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:00,512][63806] Sum rewards: -4.430, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.811', 'AMMO2': '0.036', 'ARMOR': '0.052', 'AMMO3': '0.117', 'HITCOUNT': '0.140', 'AMMO4': '0.178', 'weapon4': '0.264', 'WEAPON4': '0.350', 'DAMAGECOUNT': '0.648', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.262', 'weapon3': '1.384'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:00,719][63771] DAMAGECOUNT value on done: 2659.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:00,719][63771] Sum rewards: -7.757, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-3.112', 'AMMO2': '0.013', 'AMMO5': '0.029', 'ARMOR': '0.040', 'AMMO4': '0.063', 'weapon5': '0.076', 'AMMO3': '0.176', 'WEAPON4': '0.200', 'HITCOUNT': '0.240', 'weapon4': '0.304', 'WEAPON5': '0.500', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.975', 'FRAGCOUNT': '1.000', 'weapon2': '1.412', 'weapon3': '1.428'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:00,885][63806] DAMAGECOUNT value on done: 3319.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:00,886][63806] Sum rewards: -5.703, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.090', 'ARMOR': '0.004', 'AMMO5': '0.005', 'weapon5': '0.012', 'AMMO2': '0.033', 'WEAPON5': '0.050', 'HITCOUNT': '0.070', 'AMMO3': '0.082', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO4': '0.167', 'DAMAGECOUNT': '0.240', 'weapon4': '0.324', 'WEAPON4': '0.400', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon3': '1.060', 'weapon2': '1.740'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:01,138][63767] DAMAGECOUNT value on done: 3971.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:01,138][63767] Sum rewards: -5.526, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.386', 'AMMO2': '0.005', 'AMMO5': '0.015', 'AMMO4': '0.022', 'WEAPON1': '0.040', 'weapon5': '0.054', 'AMMO3': '0.074', 'WEAPON4': '0.150', 'HITCOUNT': '0.220', 'weapon4': '0.224', 'WEAPON5': '0.300', 'WEAPON3': '0.450', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.870', 'weapon3': '1.286', 'weapon2': '1.400'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:01,139][63771] DAMAGECOUNT value on done: 2258.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:01,481][63767] DAMAGECOUNT value on done: 3320.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:01,481][63767] Sum rewards: -3.405, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.859', 'AMMO5': '0.010', 'weapon5': '0.012', 'AMMO2': '0.014', 'ARMOR': '0.040', 'AMMO4': '0.069', 'AMMO3': '0.119', 'WEAPON5': '0.200', 'HITCOUNT': '0.200', 'WEAPON4': '0.250', 'weapon4': '0.550', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.750', 'weapon3': '1.224', 'weapon2': '1.316', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:02,088][63769] DAMAGECOUNT value on done: 2301.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:02,088][63769] Sum rewards: -4.897, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.223', 'AMMO5': '0.010', 'weapon5': '0.010', 'AMMO2': '0.012', 'WEAPON1': '0.020', 'weapon4': '0.052', 'AMMO4': '0.058', 'ARMOR': '0.060', 'WEAPON4': '0.100', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'AMMO3': '0.160', 'DAMAGECOUNT': '0.480', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.270', 'weapon2': '1.554'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:02,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11127.5, 300 sec: 11288.3). Total num frames: 6995968. Throughput: 0: 1308.6, 1: 1473.4. Samples: 1741372. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:02,460][109198] Avg episode reward: [(0, '-3.610'), (1, '-4.557')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:02,461][63576] Saving new best policy, reward=-4.557!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:02,513][63454] Saving new best policy, reward=-3.610!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:02,519][63769] DAMAGECOUNT value on done: 2917.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:02,519][63769] Sum rewards: -0.137, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.339', 'weapon7': '0.002', 'ARMOR': '0.004', 'AMMO5': '0.005', 'AMMO2': '0.022', 'WEAPON5': '0.050', 'weapon4': '0.096', 'AMMO4': '0.110', 'AMMO3': '0.147', 'WEAPON4': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.240', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.882', 'weapon2': '1.072', 'FRAGCOUNT': '2.000', 'weapon3': '2.272'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:02,633][63767] DAMAGECOUNT value on done: 3784.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:02,634][63767] Sum rewards: 0.089, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO5': '0.008', 'AMMO2': '0.028', 'weapon5': '0.032', 'AMMO3': '0.067', 'weapon7': '0.080', 'HITCOUNT': '0.090', 'WEAPON5': '0.100', 'AMMO4': '0.141', 'HEALTH': '0.192', 'WEAPON4': '0.200', 'AMMO6': '0.320', 'AMMO7': '0.320', 'weapon4': '0.346', 'WEAPON7': '0.400', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.507', 'FRAGCOUNT': '1.000', 'weapon3': '1.116', 'weapon2': '1.492'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:02,940][63767] DAMAGECOUNT value on done: 3839.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:02,941][63767] Sum rewards: -0.198, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.550', 'AMMO2': '0.010', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'ARMOR': '0.040', 'weapon5': '0.044', 'AMMO4': '0.052', 'weapon4': '0.058', 'HITCOUNT': '0.080', 'WEAPON4': '0.100', 'AMMO3': '0.119', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.450', 'weapon2': '1.288', 'weapon3': '1.486', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:03,121][63769] DAMAGECOUNT value on done: 3458.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:03,122][63769] Sum rewards: -4.240, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.164', 'AMMO5': '0.007', 'HITCOUNT': '0.010', 'weapon5': '0.016', 'AMMO2': '0.017', 'ARMOR': '0.040', 'DAMAGECOUNT': '0.045', 'WEAPON5': '0.050', 'AMMO4': '0.083', 'AMMO3': '0.121', 'WEAPON4': '0.250', 'weapon4': '0.360', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.112', 'weapon2': '1.362'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:03,266][63770] DAMAGECOUNT value on done: 3261.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:03,506][63769] DAMAGECOUNT value on done: 1924.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:03,596][63770] DAMAGECOUNT value on done: 2261.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:05,762][63805] DAMAGECOUNT value on done: 3037.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:05,763][63805] Sum rewards: -1.948, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.532', 'AMMO2': '0.002', 'AMMO5': '0.010', 'AMMO4': '0.012', 'ARMOR': '0.020', 'WEAPON4': '0.050', 'weapon4': '0.118', 'AMMO3': '0.188', 'WEAPON5': '0.200', 'HITCOUNT': '0.340', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.990', 'weapon2': '1.138', 'weapon3': '2.216', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:05,827][63733] Updated weights for policy 1, policy_version 870 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:06,098][63805] DAMAGECOUNT value on done: 3402.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:06,099][63805] Sum rewards: -3.745, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.059', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.005', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'AMMO4': '0.022', 'weapon4': '0.026', 'weapon7': '0.044', 'ARMOR': '0.068', 'AMMO3': '0.075', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'weapon5': '0.108', 'HITCOUNT': '0.190', 'WEAPON5': '0.250', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.645', 'weapon3': '1.198', 'weapon2': '1.800'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:07,167][63732] Updated weights for policy 0, policy_version 850 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:07,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11195.7, 300 sec: 11288.3). Total num frames: 7053312. Throughput: 0: 1309.5, 1: 1478.2. Samples: 1758273. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:07,460][109198] Avg episode reward: [(0, '-3.400'), (1, '-4.579')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:07,465][63454] Saving new best policy, reward=-3.400!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:08,038][63734] DAMAGECOUNT value on done: 2319.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:08,038][63734] Sum rewards: -3.497, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.594', 'weapon5': '0.004', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.032', 'ARMOR': '0.081', 'WEAPON5': '0.100', 'AMMO3': '0.101', 'AMMO4': '0.160', 'HITCOUNT': '0.170', 'WEAPON4': '0.350', 'weapon4': '0.358', 'WEAPON3': '0.500', 'weapon3': '0.574', 'DAMAGECOUNT': '0.687', 'FRAGCOUNT': '1.000', 'weapon2': '1.962'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:08,382][63734] DAMAGECOUNT value on done: 2781.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:10,569][63806] DAMAGECOUNT value on done: 3076.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:10,570][63806] Sum rewards: -0.879, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.255', 'AMMO5': '0.003', 'AMMO2': '0.029', 'weapon4': '0.062', 'AMMO3': '0.071', 'HITCOUNT': '0.090', 'AMMO4': '0.144', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.400', 'ARMOR': '0.408', 'weapon3': '0.946', 'FRAGCOUNT': '1.000', 'weapon2': '1.008'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:10,882][63806] DAMAGECOUNT value on done: 2117.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:10,882][63806] Sum rewards: -3.677, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.302', 'AMMO2': '0.018', 'weapon4': '0.054', 'ARMOR': '0.080', 'AMMO4': '0.087', 'WEAPON4': '0.100', 'AMMO3': '0.166', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.822', 'WEAPON3': '0.900', 'weapon2': '1.436', 'weapon3': '1.502', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:12,458][109198] Fps is (10 sec: 11059.0, 60 sec: 11127.5, 300 sec: 11274.4). Total num frames: 7106560. Throughput: 0: 1318.7, 1: 1488.2. Samples: 1775350. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:12,460][109198] Avg episode reward: [(0, '-3.400'), (1, '-4.583')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:12,589][63733] Updated weights for policy 1, policy_version 880 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:14,205][63805] DAMAGECOUNT value on done: 3171.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:14,205][63805] Sum rewards: -1.214, reward structure: {'DEATHCOUNT': '-9.000', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.021', 'weapon5': '0.082', 'AMMO3': '0.085', 'AMMO4': '0.104', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'HITCOUNT': '0.260', 'WEAPON3': '0.450', 'HEALTH': '0.456', 'weapon4': '0.506', 'DAMAGECOUNT': '0.948', 'weapon2': '1.054', 'weapon3': '1.502', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:14,640][63805] DAMAGECOUNT value on done: 3117.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:14,837][63770] DAMAGECOUNT value on done: 2207.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:14,838][63770] Sum rewards: -7.823, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-2.000', 'HEALTH': '-1.570', 'AMMO5': '0.012', 'AMMO2': '0.015', 'weapon5': '0.050', 'AMMO4': '0.076', 'AMMO3': '0.138', 'weapon4': '0.168', 'HITCOUNT': '0.180', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.765', 'weapon2': '1.042', 'weapon3': '1.850'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:14,844][63732] Updated weights for policy 0, policy_version 860 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:15,199][63770] DAMAGECOUNT value on done: 2821.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:15,200][63770] Sum rewards: -2.958, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.532', 'AMMO5': '0.003', 'weapon5': '0.004', 'AMMO2': '0.012', 'WEAPON5': '0.050', 'AMMO4': '0.062', 'AMMO3': '0.157', 'HITCOUNT': '0.260', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.930', 'weapon2': '1.210', 'weapon3': '1.786', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:16,239][63735] DAMAGECOUNT value on done: 3354.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:16,536][63735] DAMAGECOUNT value on done: 3287.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:16,537][63735] Sum rewards: -3.313, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.920', 'ARMOR': '0.004', 'AMMO2': '0.021', 'weapon4': '0.032', 'AMMO3': '0.102', 'AMMO4': '0.106', 'HITCOUNT': '0.120', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.216', 'weapon2': '1.256'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:17,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11195.7, 300 sec: 11288.3). Total num frames: 7168000. Throughput: 0: 1319.6, 1: 1484.7. Samples: 1783771. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:17,460][109198] Avg episode reward: [(0, '-3.408'), (1, '-4.471')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:17,468][63576] Saving new best policy, reward=-4.471!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:18,233][63735] DAMAGECOUNT value on done: 2566.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:18,539][63735] DAMAGECOUNT value on done: 2375.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:19,443][63733] Updated weights for policy 1, policy_version 890 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:19,887][63771] DAMAGECOUNT value on done: 2304.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:20,277][63771] DAMAGECOUNT value on done: 3766.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:20,277][63771] Sum rewards: -3.882, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.346', 'AMMO5': '0.003', 'AMMO2': '0.004', 'AMMO4': '0.019', 'ARMOR': '0.050', 'WEAPON4': '0.100', 'AMMO3': '0.115', 'HITCOUNT': '0.120', 'weapon4': '0.130', 'DAMAGECOUNT': '0.519', 'WEAPON3': '0.600', 'weapon2': '1.324', 'weapon3': '1.480', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:22,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11195.7, 300 sec: 11260.5). Total num frames: 7221248. Throughput: 0: 1321.1, 1: 1489.2. Samples: 1800708. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:22,460][109198] Avg episode reward: [(0, '-3.416'), (1, '-4.459')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:22,462][63576] Saving new best policy, reward=-4.459!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:22,512][63732] Updated weights for policy 0, policy_version 870 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:22,936][63734] DAMAGECOUNT value on done: 3578.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:22,936][63734] Sum rewards: 2.006, reward structure: {'DEATHCOUNT': '-5.250', 'AMMO5': '0.005', 'AMMO2': '0.027', 'AMMO3': '0.050', 'ARMOR': '0.064', 'HITCOUNT': '0.070', 'weapon5': '0.082', 'WEAPON5': '0.100', 'AMMO4': '0.132', 'WEAPON4': '0.150', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.501', 'HEALTH': '0.517', 'weapon4': '0.750', 'weapon3': '1.032', 'weapon2': '1.476', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:23,123][63767] DAMAGECOUNT value on done: 4134.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:23,123][63767] Sum rewards: -1.629, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.112', 'ARMOR': '0.008', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'AMMO5': '0.020', 'weapon5': '0.086', 'AMMO4': '0.087', 'HITCOUNT': '0.130', 'AMMO3': '0.142', 'WEAPON4': '0.150', 'weapon4': '0.320', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.489', 'WEAPON3': '0.850', 'weapon2': '1.358', 'weapon3': '1.416', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:23,333][63734] DAMAGECOUNT value on done: 2307.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:23,488][63767] DAMAGECOUNT value on done: 3512.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:24,682][63767] DAMAGECOUNT value on done: 4146.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:24,683][63767] Sum rewards: -0.529, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.389', 'AMMO5': '0.020', 'WEAPON1': '0.030', 'AMMO2': '0.040', 'AMMO3': '0.060', 'ARMOR': '0.068', 'weapon5': '0.078', 'AMMO4': '0.202', 'WEAPON5': '0.250', 'WEAPON4': '0.250', 'HITCOUNT': '0.290', 'WEAPON3': '0.350', 'weapon4': '0.404', 'DAMAGECOUNT': '1.086', 'weapon3': '1.206', 'FRAGCOUNT': '1.500', 'weapon2': '1.526'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:24,831][63806] DAMAGECOUNT value on done: 3255.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:25,058][63767] DAMAGECOUNT value on done: 4244.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:25,059][63767] Sum rewards: -3.292, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.654', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.018', 'weapon5': '0.030', 'ARMOR': '0.040', 'AMMO4': '0.090', 'WEAPON5': '0.100', 'AMMO3': '0.153', 'WEAPON4': '0.200', 'HITCOUNT': '0.310', 'weapon4': '0.336', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.215', 'weapon2': '1.508', 'weapon3': '1.546', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:25,273][63806] DAMAGECOUNT value on done: 3663.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:25,274][63806] Sum rewards: 0.684, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.118', 'AMMO5': '0.015', 'ARMOR': '0.020', 'AMMO2': '0.021', 'weapon5': '0.096', 'WEAPON4': '0.100', 'AMMO4': '0.104', 'AMMO3': '0.118', 'weapon4': '0.154', 'HITCOUNT': '0.160', 'WEAPON5': '0.300', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.032', 'weapon3': '1.384', 'weapon2': '1.648', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:25,544][63771] DAMAGECOUNT value on done: 2824.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:25,544][63771] Sum rewards: -3.099, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.898', 'AMMO2': '0.008', 'AMMO5': '0.014', 'weapon5': '0.036', 'AMMO4': '0.037', 'WEAPON4': '0.050', 'AMMO3': '0.092', 'ARMOR': '0.108', 'weapon4': '0.114', 'HITCOUNT': '0.170', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.098', 'weapon2': '1.526'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:25,952][63771] DAMAGECOUNT value on done: 2413.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:25,952][63771] Sum rewards: -3.449, reward structure: {'DEATHCOUNT': '-9.000', 'weapon5': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.010', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'AMMO4': '0.052', 'AMMO3': '0.100', 'WEAPON5': '0.100', 'HEALTH': '0.112', 'HITCOUNT': '0.140', 'weapon4': '0.200', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.102', 'weapon3': '1.562'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:26,365][63733] Updated weights for policy 1, policy_version 900 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:27,098][63769] DAMAGECOUNT value on done: 2446.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:27,098][63769] Sum rewards: -8.579, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-3.030', 'AMMO5': '0.005', 'weapon5': '0.010', 'AMMO2': '0.030', 'weapon4': '0.032', 'ARMOR': '0.064', 'WEAPON5': '0.100', 'HITCOUNT': '0.120', 'AMMO4': '0.150', 'WEAPON4': '0.200', 'AMMO3': '0.214', 'DAMAGECOUNT': '0.435', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.250', 'weapon2': '1.318', 'weapon3': '1.522'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:27,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11264.1, 300 sec: 11260.5). Total num frames: 7278592. Throughput: 0: 1325.4, 1: 1491.6. Samples: 1817532. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:27,460][109198] Avg episode reward: [(0, '-3.336'), (1, '-4.477')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:27,466][63454] Saving new best policy, reward=-3.336!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:27,531][63769] DAMAGECOUNT value on done: 3007.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:27,532][63769] Sum rewards: 1.974, reward structure: {'DEATHCOUNT': '-3.750', 'HEALTH': '-0.230', 'AMMO2': '0.002', 'AMMO5': '0.009', 'AMMO4': '0.011', 'weapon5': '0.042', 'WEAPON4': '0.050', 'AMMO3': '0.083', 'HITCOUNT': '0.090', 'weapon4': '0.094', 'ARMOR': '0.096', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.270', 'WEAPON3': '0.400', 'weapon3': '1.100', 'weapon2': '1.506', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:28,207][63769] DAMAGECOUNT value on done: 3598.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:28,207][63769] Sum rewards: -4.506, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.830', 'ARMOR': '0.008', 'weapon5': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.027', 'WEAPON5': '0.050', 'AMMO4': '0.133', 'HITCOUNT': '0.140', 'AMMO3': '0.154', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.420', 'weapon4': '0.616', 'weapon3': '0.720', 'WEAPON3': '0.750', 'weapon2': '1.788', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:28,616][63769] DAMAGECOUNT value on done: 1959.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:28,620][63805] DAMAGECOUNT value on done: 3276.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:28,620][63805] Sum rewards: -2.699, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.108', 'AMMO2': '0.007', 'WEAPON1': '0.010', 'ARMOR': '0.012', 'AMMO5': '0.027', 'AMMO4': '0.035', 'weapon5': '0.084', 'AMMO3': '0.160', 'HITCOUNT': '0.170', 'WEAPON4': '0.200', 'weapon4': '0.210', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.717', 'WEAPON3': '0.900', 'weapon2': '1.324', 'FRAGCOUNT': '1.500', 'weapon3': '1.902'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:28,635][63770] DAMAGECOUNT value on done: 3692.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:28,636][63770] Sum rewards: -1.451, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.379', 'AMMO4': '-0.022', 'AMMO2': '-0.004', 'ARMOR': '0.004', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'weapon5': '0.160', 'AMMO3': '0.195', 'HITCOUNT': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '1.100', 'DAMAGECOUNT': '1.293', 'weapon2': '1.378', 'weapon3': '1.892', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:29,018][63805] DAMAGECOUNT value on done: 3702.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:29,019][63805] Sum rewards: -5.185, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.485', 'AMMO2': '0.006', 'AMMO5': '0.017', 'AMMO4': '0.029', 'ARMOR': '0.036', 'weapon5': '0.038', 'AMMO3': '0.128', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'HITCOUNT': '0.250', 'weapon4': '0.386', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.900', 'weapon2': '1.324', 'weapon3': '1.686'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:29,026][63770] DAMAGECOUNT value on done: 2525.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:30,420][63732] Updated weights for policy 0, policy_version 880 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:31,655][63734] DAMAGECOUNT value on done: 2469.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:31,655][63734] Sum rewards: -0.479, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.360', 'AMMO2': '0.003', 'AMMO4': '0.014', 'ARMOR': '0.092', 'HITCOUNT': '0.100', 'AMMO3': '0.128', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.750', 'weapon2': '1.238', 'weapon3': '1.606', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:32,065][63734] DAMAGECOUNT value on done: 2851.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:32,066][63734] Sum rewards: -2.741, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.591', 'weapon5': '0.002', 'ARMOR': '0.004', 'AMMO2': '0.009', 'AMMO5': '0.010', 'AMMO4': '0.044', 'HITCOUNT': '0.080', 'AMMO3': '0.163', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.210', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.180', 'weapon2': '1.798'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:32,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11195.7, 300 sec: 11246.6). Total num frames: 7331840. Throughput: 0: 1319.2, 1: 1489.3. Samples: 1825647. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:32,460][109198] Avg episode reward: [(0, '-3.276'), (1, '-4.414')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:32,461][63454] Saving new best policy, reward=-3.276!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:32,461][63576] Saving new best policy, reward=-4.414!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:33,274][63806] DAMAGECOUNT value on done: 3196.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:33,388][63733] Updated weights for policy 1, policy_version 910 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:33,633][63806] DAMAGECOUNT value on done: 2414.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:33,633][63806] Sum rewards: -2.333, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.209', 'AMMO2': '0.000', 'AMMO4': '0.002', 'AMMO5': '0.005', 'ARMOR': '0.032', 'weapon5': '0.046', 'AMMO3': '0.090', 'WEAPON5': '0.100', 'HITCOUNT': '0.160', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.891', 'FRAGCOUNT': '1.000', 'weapon2': '1.108', 'weapon3': '1.442'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:37,458][109198] Fps is (10 sec: 10649.6, 60 sec: 11195.7, 300 sec: 11232.8). Total num frames: 7385088. Throughput: 0: 1319.7, 1: 1490.5. Samples: 1842368. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:37,460][109198] Avg episode reward: [(0, '-3.276'), (1, '-4.370')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:37,497][63576] Saving new best policy, reward=-4.370!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:38,226][63732] Updated weights for policy 0, policy_version 890 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:38,924][63735] DAMAGECOUNT value on done: 3693.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:38,924][63735] Sum rewards: -3.098, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.034', 'ARMOR': '0.004', 'AMMO5': '0.005', 'weapon5': '0.016', 'AMMO2': '0.017', 'weapon4': '0.052', 'AMMO4': '0.085', 'WEAPON5': '0.100', 'AMMO3': '0.133', 'WEAPON4': '0.150', 'HITCOUNT': '0.280', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.017', 'weapon2': '1.076', 'weapon3': '1.550', 'FRAGCOUNT': '2.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:39,172][63805] DAMAGECOUNT value on done: 3942.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:39,172][63805] Sum rewards: 0.853, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO2': '0.004', 'AMMO5': '0.017', 'AMMO4': '0.022', 'ARMOR': '0.084', 'weapon5': '0.108', 'AMMO3': '0.132', 'HEALTH': '0.236', 'WEAPON5': '0.300', 'HITCOUNT': '0.410', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.750', 'weapon2': '1.264', 'weapon3': '2.212', 'DAMAGECOUNT': '2.313'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:39,255][63735] DAMAGECOUNT value on done: 3372.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:39,587][63805] DAMAGECOUNT value on done: 3182.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:39,587][63805] Sum rewards: -4.346, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.672', 'AMMO5': '0.007', 'AMMO2': '0.009', 'ARMOR': '0.020', 'AMMO4': '0.046', 'HITCOUNT': '0.070', 'AMMO3': '0.126', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.195', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.426', 'weapon3': '1.526'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:40,279][63733] Updated weights for policy 1, policy_version 920 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:40,294][63770] DAMAGECOUNT value on done: 2502.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:40,295][63770] Sum rewards: -8.434, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.824', 'FRAGCOUNT': '-1.000', 'AMMO2': '0.012', 'AMMO5': '0.017', 'ARMOR': '0.032', 'AMMO4': '0.062', 'weapon5': '0.074', 'WEAPON4': '0.100', 'AMMO3': '0.188', 'HITCOUNT': '0.190', 'weapon4': '0.274', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.885', 'WEAPON3': '1.100', 'weapon2': '1.456', 'weapon3': '1.700'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:40,670][63770] DAMAGECOUNT value on done: 3130.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:40,670][63770] Sum rewards: -3.501, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.847', 'AMMO5': '0.010', 'AMMO2': '0.010', 'AMMO4': '0.050', 'WEAPON4': '0.100', 'weapon4': '0.106', 'WEAPON5': '0.150', 'AMMO3': '0.200', 'HITCOUNT': '0.260', 'ARMOR': '0.412', 'weapon2': '0.770', 'DAMAGECOUNT': '0.927', 'WEAPON3': '1.200', 'weapon3': '2.150', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:42,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11264.0, 300 sec: 11232.8). Total num frames: 7446528. Throughput: 0: 1318.8, 1: 1488.3. Samples: 1859241. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:42,459][109198] Avg episode reward: [(0, '-3.265'), (1, '-4.406')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:42,461][63454] Saving new best policy, reward=-3.265!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:42,584][63735] DAMAGECOUNT value on done: 3146.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:42,584][63735] Sum rewards: -0.525, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.390', 'AMMO2': '0.015', 'AMMO5': '0.016', 'ARMOR': '0.036', 'AMMO4': '0.072', 'AMMO3': '0.114', 'weapon5': '0.128', 'WEAPON4': '0.150', 'weapon4': '0.204', 'WEAPON5': '0.300', 'HITCOUNT': '0.310', 'WEAPON3': '0.700', 'weapon2': '1.526', 'weapon3': '1.554', 'DAMAGECOUNT': '1.740', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:42,911][63735] DAMAGECOUNT value on done: 2395.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:43,395][63771] DAMAGECOUNT value on done: 2414.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:43,396][63771] Sum rewards: -5.925, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.388', 'AMMO5': '0.005', 'AMMO2': '0.008', 'WEAPON1': '0.020', 'weapon5': '0.032', 'AMMO4': '0.041', 'ARMOR': '0.056', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.122', 'weapon4': '0.146', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.076', 'weapon2': '1.326'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:43,783][63771] DAMAGECOUNT value on done: 3856.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:43,784][63771] Sum rewards: -3.385, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.093', 'AMMO5': '0.010', 'AMMO2': '0.016', 'WEAPON1': '0.030', 'HITCOUNT': '0.070', 'AMMO3': '0.075', 'AMMO4': '0.080', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.270', 'WEAPON3': '0.450', 'FRAGCOUNT': '1.000', 'weapon2': '1.354', 'weapon3': '1.452'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:45,752][63767] DAMAGECOUNT value on done: 4250.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:46,050][63732] Updated weights for policy 0, policy_version 900 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:46,165][63767] DAMAGECOUNT value on done: 3919.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:47,125][63733] Updated weights for policy 1, policy_version 930 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:47,435][63767] DAMAGECOUNT value on done: 4515.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:47,436][63767] Sum rewards: -5.838, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.106', 'AMMO5': '0.011', 'AMMO2': '0.029', 'weapon5': '0.128', 'AMMO4': '0.143', 'WEAPON5': '0.200', 'AMMO3': '0.214', 'HITCOUNT': '0.260', 'weapon4': '0.292', 'WEAPON4': '0.300', 'FRAGCOUNT': '0.500', 'ARMOR': '0.618', 'DAMAGECOUNT': '1.107', 'WEAPON3': '1.200', 'weapon3': '1.586', 'weapon2': '1.680'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:47,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11195.7, 300 sec: 11218.9). Total num frames: 7499776. Throughput: 0: 1318.4, 1: 1489.9. Samples: 1867748. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:47,460][109198] Avg episode reward: [(0, '-3.227'), (1, '-4.522')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:47,466][63454] Saving new best policy, reward=-3.227!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:47,819][63767] DAMAGECOUNT value on done: 4448.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:47,819][63767] Sum rewards: -5.578, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.020', 'FRAGCOUNT': '-0.500', 'ARMOR': '0.012', 'AMMO5': '0.020', 'WEAPON1': '0.020', 'AMMO2': '0.026', 'weapon5': '0.084', 'AMMO3': '0.127', 'AMMO4': '0.131', 'HITCOUNT': '0.180', 'WEAPON4': '0.300', 'WEAPON5': '0.450', 'weapon4': '0.514', 'DAMAGECOUNT': '0.612', 'WEAPON3': '0.750', 'weapon2': '1.226', 'weapon3': '1.490'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:48,353][63734] DAMAGECOUNT value on done: 4013.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:48,354][63734] Sum rewards: 0.450, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.447', 'AMMO5': '0.014', 'weapon5': '0.020', 'AMMO2': '0.020', 'ARMOR': '0.024', 'AMMO4': '0.100', 'AMMO3': '0.142', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'HITCOUNT': '0.280', 'weapon4': '0.514', 'WEAPON3': '0.750', 'weapon2': '0.890', 'DAMAGECOUNT': '1.305', 'weapon3': '1.888', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:48,760][63734] DAMAGECOUNT value on done: 2455.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:48,761][63734] Sum rewards: -7.424, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.756', 'weapon5': '0.002', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO2': '0.019', 'ARMOR': '0.040', 'AMMO4': '0.093', 'HITCOUNT': '0.130', 'weapon4': '0.130', 'AMMO3': '0.135', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.444', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.004', 'weapon2': '1.512'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:49,051][63806] DAMAGECOUNT value on done: 3385.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:49,051][63806] Sum rewards: -4.172, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.281', 'AMMO2': '0.006', 'AMMO5': '0.010', 'AMMO4': '0.030', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'ARMOR': '0.105', 'AMMO3': '0.106', 'HITCOUNT': '0.120', 'weapon4': '0.120', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.202', 'weapon2': '1.520'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:49,462][63806] DAMAGECOUNT value on done: 3833.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:49,462][63806] Sum rewards: 1.252, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.152', 'AMMO5': '0.007', 'AMMO2': '0.023', 'weapon7': '0.056', 'AMMO3': '0.058', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.113', 'weapon5': '0.150', 'HITCOUNT': '0.180', 'weapon4': '0.278', 'AMMO6': '0.300', 'WEAPON7': '0.300', 'AMMO7': '0.300', 'WEAPON3': '0.350', 'DAMAGECOUNT': '0.510', 'FRAGCOUNT': '1.000', 'weapon3': '1.174', 'weapon2': '1.196', 'ARMOR': '1.208'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:50,656][63771] DAMAGECOUNT value on done: 3375.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:50,657][63771] Sum rewards: -2.204, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.101', 'AMMO4': '-0.002', 'AMMO2': '-0.000', 'AMMO5': '0.010', 'weapon5': '0.072', 'WEAPON4': '0.100', 'AMMO3': '0.152', 'WEAPON5': '0.250', 'HITCOUNT': '0.320', 'weapon4': '0.322', 'ARMOR': '0.567', 'WEAPON3': '0.750', 'weapon3': '1.534', 'DAMAGECOUNT': '1.653', 'weapon2': '1.668', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:51,038][63771] DAMAGECOUNT value on done: 2621.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:51,039][63771] Sum rewards: -6.275, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.493', 'AMMO5': '0.005', 'AMMO2': '0.012', 'ARMOR': '0.048', 'AMMO4': '0.058', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.129', 'HITCOUNT': '0.160', 'weapon4': '0.200', 'DAMAGECOUNT': '0.624', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.262', 'weapon2': '1.270'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:51,686][63805] DAMAGECOUNT value on done: 3692.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:51,687][63805] Sum rewards: -2.273, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.884', 'AMMO2': '0.019', 'WEAPON1': '0.020', 'ARMOR': '0.025', 'AMMO5': '0.031', 'AMMO4': '0.093', 'AMMO3': '0.118', 'weapon4': '0.224', 'weapon5': '0.238', 'WEAPON4': '0.250', 'HITCOUNT': '0.300', 'WEAPON5': '0.450', 'WEAPON3': '0.750', 'weapon3': '1.240', 'DAMAGECOUNT': '1.248', 'weapon2': '1.356', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:52,000][63805] DAMAGECOUNT value on done: 4353.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:52,001][63805] Sum rewards: 0.132, reward structure: {'DEATHCOUNT': '-9.750', 'AMMO5': '0.016', 'ARMOR': '0.032', 'AMMO2': '0.040', 'HEALTH': '0.048', 'AMMO3': '0.106', 'weapon5': '0.144', 'AMMO4': '0.200', 'WEAPON4': '0.250', 'WEAPON5': '0.300', 'weapon4': '0.340', 'HITCOUNT': '0.390', 'WEAPON3': '0.600', 'weapon2': '1.410', 'weapon3': '1.552', 'DAMAGECOUNT': '1.953', 'FRAGCOUNT': '2.500'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:52,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11195.7, 300 sec: 11218.9). Total num frames: 7557120. Throughput: 0: 1315.0, 1: 1485.1. Samples: 1884278. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:52,460][109198] Avg episode reward: [(0, '-3.260'), (1, '-4.650')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:52,472][63769] DAMAGECOUNT value on done: 2660.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:52,473][63769] Sum rewards: -4.309, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.000', 'AMMO5': '0.005', 'AMMO2': '0.014', 'weapon5': '0.018', 'ARMOR': '0.044', 'AMMO4': '0.068', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.143', 'weapon4': '0.168', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.642', 'WEAPON3': '0.850', 'weapon2': '1.148', 'weapon3': '1.182', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:52,895][63769] DAMAGECOUNT value on done: 3549.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:52,895][63769] Sum rewards: -0.773, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.735', 'ARMOR': '0.004', 'AMMO5': '0.005', 'AMMO2': '0.017', 'WEAPON5': '0.050', 'weapon5': '0.050', 'weapon7': '0.052', 'AMMO4': '0.084', 'AMMO3': '0.088', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON4': '0.150', 'HITCOUNT': '0.260', 'weapon4': '0.266', 'WEAPON3': '0.600', 'weapon3': '1.304', 'weapon2': '1.606', 'DAMAGECOUNT': '1.626', 'FRAGCOUNT': '2.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:53,543][63769] DAMAGECOUNT value on done: 4214.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:53,544][63769] Sum rewards: 0.875, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.620', 'AMMO2': '0.006', 'AMMO5': '0.022', 'AMMO4': '0.032', 'AMMO3': '0.078', 'WEAPON4': '0.150', 'weapon5': '0.248', 'HITCOUNT': '0.310', 'weapon4': '0.394', 'WEAPON5': '0.400', 'ARMOR': '0.451', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon2': '1.096', 'weapon3': '1.660', 'DAMAGECOUNT': '1.848'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:53,878][63770] DAMAGECOUNT value on done: 3835.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:53,878][63770] Sum rewards: -5.856, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.541', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.026', 'AMMO2': '0.030', 'WEAPON1': '0.030', 'ARMOR': '0.036', 'AMMO3': '0.105', 'AMMO4': '0.149', 'weapon5': '0.152', 'HITCOUNT': '0.160', 'weapon4': '0.348', 'WEAPON4': '0.350', 'DAMAGECOUNT': '0.429', 'WEAPON5': '0.450', 'WEAPON3': '0.750', 'weapon2': '1.088', 'weapon3': '1.582'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:53,897][63769] DAMAGECOUNT value on done: 2054.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:53,897][63769] Sum rewards: -3.227, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.046', 'AMMO2': '0.001', 'AMMO4': '0.006', 'ARMOR': '0.028', 'HITCOUNT': '0.090', 'AMMO3': '0.114', 'DAMAGECOUNT': '0.285', 'WEAPON3': '0.700', 'weapon2': '1.186', 'weapon3': '1.658', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:53,965][63732] Updated weights for policy 0, policy_version 910 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:54,062][63733] Updated weights for policy 1, policy_version 940 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:54,322][63770] DAMAGECOUNT value on done: 2719.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:54,323][63770] Sum rewards: -2.621, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.113', 'AMMO5': '0.005', 'AMMO2': '0.012', 'AMMO4': '0.061', 'AMMO3': '0.071', 'weapon4': '0.074', 'ARMOR': '0.076', 'HITCOUNT': '0.120', 'WEAPON4': '0.150', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.582', 'weapon3': '0.794', 'weapon2': '1.596', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:55,123][63734] DAMAGECOUNT value on done: 2569.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:55,509][63734] DAMAGECOUNT value on done: 2906.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:55,509][63734] Sum rewards: -7.511, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.760', 'AMMO4': '-0.058', 'AMMO2': '-0.011', 'AMMO5': '0.005', 'weapon7': '0.008', 'ARMOR': '0.040', 'HITCOUNT': '0.060', 'AMMO3': '0.128', 'DAMAGECOUNT': '0.165', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.340', 'weapon2': '1.722'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:55,839][63806] DAMAGECOUNT value on done: 3381.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:55,839][63806] Sum rewards: -4.740, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.710', 'AMMO2': '0.017', 'WEAPON4': '0.050', 'ARMOR': '0.053', 'AMMO4': '0.082', 'weapon4': '0.120', 'AMMO3': '0.133', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.555', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.336', 'weapon2': '1.554'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:47:56,215][63806] DAMAGECOUNT value on done: 2554.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:57,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11195.7, 300 sec: 11218.9). Total num frames: 7610368. Throughput: 0: 1311.5, 1: 1482.8. Samples: 1901092. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:47:57,460][109198] Avg episode reward: [(0, '-3.243'), (1, '-4.707')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:00,803][63733] Updated weights for policy 1, policy_version 950 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:01,680][63732] Updated weights for policy 0, policy_version 920 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:01,728][63735] DAMAGECOUNT value on done: 3848.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:01,728][63735] Sum rewards: -7.437, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.354', 'AMMO5': '0.005', 'AMMO2': '0.015', 'ARMOR': '0.044', 'AMMO4': '0.072', 'weapon4': '0.082', 'WEAPON5': '0.100', 'WEAPON4': '0.150', 'AMMO3': '0.158', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.134', 'weapon3': '1.672'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:02,059][63735] DAMAGECOUNT value on done: 3431.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:02,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11195.7, 300 sec: 11218.9). Total num frames: 7667712. Throughput: 0: 1312.0, 1: 1484.2. Samples: 1909598. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:02,460][109198] Avg episode reward: [(0, '-3.243'), (1, '-4.692')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:03,972][63805] DAMAGECOUNT value on done: 4167.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:03,973][63805] Sum rewards: -8.040, reward structure: {'DEATHCOUNT': '-10.500', 'FRAGCOUNT': '-2.000', 'HEALTH': '-1.399', 'AMMO5': '0.011', 'AMMO2': '0.019', 'ARMOR': '0.040', 'AMMO4': '0.093', 'WEAPON4': '0.150', 'HITCOUNT': '0.150', 'weapon4': '0.152', 'AMMO3': '0.155', 'weapon5': '0.216', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.950', 'weapon2': '1.152', 'weapon3': '1.796'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:04,364][63805] DAMAGECOUNT value on done: 3337.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:04,365][63805] Sum rewards: -3.505, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.438', 'AMMO2': '0.017', 'weapon4': '0.032', 'ARMOR': '0.040', 'AMMO4': '0.084', 'WEAPON4': '0.100', 'AMMO3': '0.107', 'HITCOUNT': '0.120', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.216', 'weapon3': '1.402'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:05,508][63770] DAMAGECOUNT value on done: 2962.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:05,509][63770] Sum rewards: -2.714, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.803', 'AMMO5': '0.018', 'AMMO2': '0.028', 'ARMOR': '0.064', 'weapon5': '0.072', 'AMMO3': '0.137', 'AMMO4': '0.140', 'WEAPON4': '0.200', 'weapon4': '0.230', 'WEAPON5': '0.300', 'HITCOUNT': '0.390', 'WEAPON3': '0.850', 'weapon2': '1.022', 'DAMAGECOUNT': '1.380', 'FRAGCOUNT': '2.000', 'weapon3': '2.008'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:05,915][63770] DAMAGECOUNT value on done: 3240.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:06,529][63771] DAMAGECOUNT value on done: 2485.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:06,894][63771] DAMAGECOUNT value on done: 3935.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:07,170][63735] DAMAGECOUNT value on done: 3431.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:07,171][63735] Sum rewards: -6.303, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.476', 'AMMO5': '0.010', 'AMMO2': '0.014', 'ARMOR': '0.040', 'AMMO4': '0.068', 'weapon4': '0.088', 'weapon5': '0.114', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'AMMO3': '0.210', 'HITCOUNT': '0.240', 'DAMAGECOUNT': '0.855', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.200', 'weapon2': '1.200', 'weapon3': '2.084'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:07,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11195.7, 300 sec: 11218.9). Total num frames: 7725056. Throughput: 0: 1319.2, 1: 1475.6. Samples: 1926474. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:07,460][109198] Avg episode reward: [(0, '-3.290'), (1, '-4.695')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:07,603][63735] DAMAGECOUNT value on done: 2528.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:08,090][63733] Updated weights for policy 1, policy_version 960 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:08,346][63767] DAMAGECOUNT value on done: 4479.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:08,347][63767] Sum rewards: -7.117, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.390', 'AMMO5': '0.007', 'AMMO2': '0.019', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'weapon5': '0.068', 'weapon4': '0.090', 'AMMO4': '0.096', 'AMMO3': '0.131', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'DAMAGECOUNT': '0.687', 'WEAPON3': '0.850', 'weapon2': '1.124', 'weapon3': '1.940'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:08,666][63767] DAMAGECOUNT value on done: 4097.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:08,666][63767] Sum rewards: -4.000, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.599', 'AMMO5': '0.007', 'AMMO2': '0.016', 'weapon5': '0.026', 'ARMOR': '0.061', 'AMMO4': '0.081', 'AMMO3': '0.089', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'HITCOUNT': '0.200', 'weapon4': '0.326', 'DAMAGECOUNT': '0.534', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.122', 'weapon2': '1.436'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:09,039][63732] Updated weights for policy 0, policy_version 930 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:09,846][63767] DAMAGECOUNT value on done: 4755.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:09,847][63767] Sum rewards: -3.036, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.566', 'AMMO5': '0.007', 'weapon5': '0.018', 'AMMO2': '0.021', 'ARMOR': '0.036', 'weapon4': '0.038', 'AMMO3': '0.082', 'AMMO4': '0.104', 'WEAPON5': '0.150', 'HITCOUNT': '0.250', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.720', 'weapon3': '1.390', 'weapon2': '1.664', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:10,189][63767] DAMAGECOUNT value on done: 4895.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:10,190][63767] Sum rewards: -1.612, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.950', 'AMMO5': '0.012', 'AMMO2': '0.015', 'ARMOR': '0.036', 'weapon4': '0.056', 'weapon5': '0.062', 'AMMO4': '0.072', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'AMMO3': '0.162', 'HITCOUNT': '0.320', 'WEAPON3': '0.950', 'weapon2': '1.282', 'DAMAGECOUNT': '1.341', 'weapon3': '2.030', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:12,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11264.0, 300 sec: 11205.0). Total num frames: 7782400. Throughput: 0: 1320.4, 1: 1472.2. Samples: 1943198. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:12,460][109198] Avg episode reward: [(0, '-3.221'), (1, '-4.702')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:12,462][63454] Saving new best policy, reward=-3.221!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:13,173][63806] DAMAGECOUNT value on done: 3695.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:13,173][63806] Sum rewards: -3.769, reward structure: {'DEATHCOUNT': '-9.750', 'AMMO2': '0.004', 'AMMO4': '0.021', 'HEALTH': '0.022', 'ARMOR': '0.028', 'AMMO3': '0.130', 'HITCOUNT': '0.270', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.930', 'FRAGCOUNT': '1.000', 'weapon2': '1.252', 'weapon3': '1.624'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:13,363][63734] DAMAGECOUNT value on done: 4318.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:13,364][63734] Sum rewards: -4.632, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.915', 'WEAPON1': '0.010', 'AMMO2': '0.013', 'AMMO5': '0.015', 'ARMOR': '0.032', 'weapon4': '0.062', 'AMMO4': '0.065', 'AMMO3': '0.140', 'WEAPON4': '0.150', 'weapon5': '0.168', 'HITCOUNT': '0.250', 'WEAPON5': '0.300', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.915', 'FRAGCOUNT': '1.000', 'weapon3': '1.432', 'weapon2': '1.480'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:13,508][63806] DAMAGECOUNT value on done: 4060.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:13,509][63806] Sum rewards: -8.030, reward structure: {'DEATHCOUNT': '-11.250', 'FRAGCOUNT': '-2.000', 'HEALTH': '-0.190', 'AMMO5': '0.007', 'ARMOR': '0.024', 'AMMO2': '0.039', 'weapon5': '0.052', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'weapon4': '0.102', 'AMMO3': '0.126', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'AMMO4': '0.192', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.681', 'weapon3': '1.246', 'weapon2': '1.520'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:13,735][63734] DAMAGECOUNT value on done: 2663.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:13,736][63734] Sum rewards: 1.661, reward structure: {'DEATHCOUNT': '-4.500', 'weapon5': '0.002', 'AMMO5': '0.005', 'AMMO2': '0.007', 'AMMO4': '0.036', 'weapon7': '0.042', 'WEAPON5': '0.050', 'AMMO3': '0.080', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'HITCOUNT': '0.120', 'WEAPON3': '0.300', 'ARMOR': '0.500', 'DAMAGECOUNT': '0.624', 'HEALTH': '0.710', 'weapon3': '0.958', 'FRAGCOUNT': '1.000', 'weapon2': '1.426'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:14,301][63805] DAMAGECOUNT value on done: 4019.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:14,302][63805] Sum rewards: -0.273, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.468', 'AMMO4': '-0.012', 'AMMO2': '-0.002', 'AMMO5': '0.003', 'weapon4': '0.046', 'WEAPON4': '0.050', 'weapon5': '0.050', 'AMMO3': '0.093', 'WEAPON5': '0.100', 'HITCOUNT': '0.200', 'WEAPON3': '0.350', 'FRAGCOUNT': '0.500', 'ARMOR': '0.512', 'DAMAGECOUNT': '0.981', 'weapon2': '1.132', 'weapon3': '1.442'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:14,653][63805] DAMAGECOUNT value on done: 4733.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:14,654][63805] Sum rewards: -0.854, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.560', 'AMMO2': '0.003', 'AMMO4': '0.013', 'weapon4': '0.032', 'WEAPON4': '0.050', 'weapon7': '0.070', 'AMMO3': '0.116', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON7': '0.200', 'HITCOUNT': '0.230', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.140', 'weapon2': '1.314', 'weapon3': '1.548'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:14,834][63733] Updated weights for policy 1, policy_version 970 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:15,834][63771] DAMAGECOUNT value on done: 3952.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:15,835][63771] Sum rewards: 3.371, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.354', 'AMMO2': '0.003', 'ARMOR': '0.012', 'AMMO4': '0.014', 'AMMO5': '0.016', 'weapon5': '0.094', 'weapon4': '0.100', 'WEAPON4': '0.150', 'AMMO3': '0.196', 'WEAPON5': '0.200', 'HITCOUNT': '0.260', 'WEAPON3': '0.900', 'weapon3': '1.412', 'DAMAGECOUNT': '1.731', 'weapon2': '1.886', 'FRAGCOUNT': '6.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:16,231][63771] DAMAGECOUNT value on done: 2792.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:16,232][63771] Sum rewards: -5.265, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.350', 'AMMO2': '0.002', 'AMMO5': '0.005', 'weapon5': '0.006', 'AMMO4': '0.012', 'WEAPON5': '0.100', 'AMMO3': '0.160', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.513', 'ARMOR': '0.515', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.514', 'weapon2': '1.538'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:17,437][63732] Updated weights for policy 0, policy_version 940 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:17,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11195.7, 300 sec: 11205.0). Total num frames: 7839744. Throughput: 0: 1316.3, 1: 1483.8. Samples: 1951651. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:17,460][109198] Avg episode reward: [(0, '-3.068'), (1, '-4.605')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:17,465][63454] Saving new best policy, reward=-3.068!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:17,555][63769] DAMAGECOUNT value on done: 2885.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:17,555][63769] Sum rewards: -5.274, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.390', 'AMMO5': '0.003', 'weapon5': '0.004', 'AMMO2': '0.019', 'WEAPON5': '0.050', 'AMMO4': '0.097', 'WEAPON4': '0.100', 'AMMO3': '0.118', 'HITCOUNT': '0.170', 'weapon4': '0.190', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.675', 'weapon3': '1.242', 'FRAGCOUNT': '1.500', 'weapon2': '1.548'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:17,898][63769] DAMAGECOUNT value on done: 3943.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:17,899][63769] Sum rewards: 0.716, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.820', 'AMMO5': '0.008', 'AMMO2': '0.024', 'weapon5': '0.078', 'weapon4': '0.094', 'ARMOR': '0.100', 'AMMO3': '0.111', 'AMMO4': '0.121', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'HITCOUNT': '0.210', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.182', 'weapon3': '1.478', 'weapon2': '1.630', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:18,196][63806] DAMAGECOUNT value on done: 3461.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:18,362][63734] DAMAGECOUNT value on done: 2894.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:18,362][63734] Sum rewards: -5.386, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.300', 'AMMO5': '0.010', 'AMMO2': '0.016', 'weapon5': '0.018', 'WEAPON1': '0.020', 'weapon4': '0.052', 'ARMOR': '0.072', 'AMMO4': '0.082', 'WEAPON4': '0.100', 'AMMO3': '0.133', 'WEAPON5': '0.150', 'HITCOUNT': '0.200', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.975', 'weapon2': '1.346', 'weapon3': '1.440', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:18,610][63769] DAMAGECOUNT value on done: 4339.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:18,610][63769] Sum rewards: -2.514, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-2.177', 'AMMO4': '-0.024', 'AMMO2': '-0.005', 'AMMO5': '0.017', 'ARMOR': '0.080', 'weapon5': '0.096', 'WEAPON4': '0.100', 'AMMO3': '0.112', 'HITCOUNT': '0.150', 'weapon4': '0.248', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.650', 'weapon2': '0.974', 'FRAGCOUNT': '1.000', 'weapon3': '1.590'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:18,654][63806] DAMAGECOUNT value on done: 2850.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:18,655][63806] Sum rewards: -2.754, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.582', 'AMMO5': '0.005', 'AMMO2': '0.011', 'AMMO4': '0.055', 'AMMO3': '0.095', 'ARMOR': '0.100', 'weapon4': '0.124', 'WEAPON4': '0.150', 'HITCOUNT': '0.180', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.888', 'weapon2': '1.022', 'weapon3': '1.748', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:18,757][63734] DAMAGECOUNT value on done: 2996.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:18,950][63769] DAMAGECOUNT value on done: 2169.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:18,951][63769] Sum rewards: -2.216, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.654', 'weapon5': '0.002', 'AMMO5': '0.007', 'AMMO2': '0.019', 'WEAPON5': '0.050', 'AMMO3': '0.068', 'ARMOR': '0.084', 'HITCOUNT': '0.090', 'AMMO4': '0.096', 'WEAPON4': '0.200', 'weapon4': '0.258', 'DAMAGECOUNT': '0.345', 'WEAPON3': '0.350', 'weapon3': '0.682', 'FRAGCOUNT': '1.000', 'weapon2': '1.936'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:19,226][63770] DAMAGECOUNT value on done: 4056.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:19,227][63770] Sum rewards: 1.409, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.170', 'AMMO2': '0.006', 'AMMO5': '0.020', 'AMMO4': '0.027', 'weapon7': '0.086', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.109', 'weapon4': '0.124', 'WEAPON4': '0.150', 'HITCOUNT': '0.180', 'weapon5': '0.302', 'WEAPON5': '0.400', 'ARMOR': '0.471', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.663', 'weapon2': '1.210', 'weapon3': '1.630', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:19,621][63770] DAMAGECOUNT value on done: 2844.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:21,295][63733] Updated weights for policy 1, policy_version 980 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:22,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11195.7, 300 sec: 11191.1). Total num frames: 7892992. Throughput: 0: 1302.1, 1: 1493.9. Samples: 1968190. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:22,460][109198] Avg episode reward: [(0, '-2.890'), (1, '-4.678')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:22,461][63454] Saving new best policy, reward=-2.890!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:25,430][63732] Updated weights for policy 0, policy_version 950 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:26,347][63735] DAMAGECOUNT value on done: 4008.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:26,732][63735] DAMAGECOUNT value on done: 3848.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:26,733][63735] Sum rewards: -6.519, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-1.910', 'AMMO5': '0.013', 'AMMO2': '0.019', 'weapon4': '0.030', 'weapon5': '0.050', 'AMMO4': '0.095', 'WEAPON5': '0.150', 'AMMO3': '0.186', 'WEAPON4': '0.200', 'HITCOUNT': '0.330', 'WEAPON3': '1.100', 'weapon2': '1.154', 'DAMAGECOUNT': '1.251', 'weapon3': '2.064', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:27,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11195.7, 300 sec: 11191.1). Total num frames: 7950336. Throughput: 0: 1302.2, 1: 1493.6. Samples: 1985050. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:27,460][109198] Avg episode reward: [(0, '-2.883'), (1, '-4.724')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:27,467][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000989_4050944.pth...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:27,468][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000952_3899392.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:27,526][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000638_2613248.pth\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:27,527][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000652_2670592.pth\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:27,533][63454] Saving new best policy, reward=-2.883!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:28,146][63733] Updated weights for policy 1, policy_version 990 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:28,928][63805] DAMAGECOUNT value on done: 4529.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:28,929][63805] Sum rewards: 0.758, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.628', 'AMMO5': '0.005', 'ARMOR': '0.020', 'AMMO2': '0.023', 'weapon4': '0.036', 'AMMO4': '0.114', 'AMMO3': '0.120', 'WEAPON4': '0.200', 'HITCOUNT': '0.230', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.086', 'weapon2': '1.412', 'weapon3': '1.740', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:29,326][63805] DAMAGECOUNT value on done: 3509.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:29,327][63805] Sum rewards: -6.323, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.678', 'weapon5': '0.002', 'AMMO5': '0.007', 'ARMOR': '0.012', 'AMMO2': '0.015', 'WEAPON1': '0.030', 'AMMO4': '0.076', 'AMMO3': '0.106', 'HITCOUNT': '0.130', 'WEAPON5': '0.150', 'weapon4': '0.176', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.516', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.204', 'weapon3': '1.780'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:29,628][63771] DAMAGECOUNT value on done: 2575.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:29,629][63771] Sum rewards: -6.100, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.914', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'AMMO2': '0.006', 'WEAPON1': '0.010', 'ARMOR': '0.012', 'AMMO4': '0.030', 'WEAPON4': '0.050', 'HITCOUNT': '0.070', 'AMMO3': '0.080', 'weapon5': '0.088', 'weapon7': '0.088', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.102', 'DAMAGECOUNT': '0.270', 'WEAPON3': '0.500', 'weapon3': '1.196', 'weapon2': '1.406'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:29,979][63771] DAMAGECOUNT value on done: 4026.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:29,979][63771] Sum rewards: 0.286, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.564', 'AMMO2': '0.011', 'AMMO4': '0.056', 'AMMO3': '0.081', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'weapon4': '0.184', 'DAMAGECOUNT': '0.273', 'WEAPON3': '0.450', 'ARMOR': '0.508', 'weapon3': '0.826', 'weapon2': '1.520', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:30,638][63767] DAMAGECOUNT value on done: 4629.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:30,639][63767] Sum rewards: -2.764, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.794', 'AMMO2': '0.005', 'AMMO4': '0.025', 'weapon4': '0.082', 'HITCOUNT': '0.100', 'ARMOR': '0.108', 'AMMO3': '0.123', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.750', 'weapon3': '1.554', 'weapon2': '1.682', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:30,839][63770] DAMAGECOUNT value on done: 3157.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:30,840][63770] Sum rewards: -2.833, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.950', 'AMMO5': '0.007', 'AMMO2': '0.047', 'ARMOR': '0.056', 'AMMO3': '0.094', 'WEAPON5': '0.100', 'HITCOUNT': '0.150', 'AMMO4': '0.235', 'weapon4': '0.388', 'WEAPON4': '0.400', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.585', 'FRAGCOUNT': '1.000', 'weapon3': '1.166', 'weapon2': '1.638'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:31,014][63767] DAMAGECOUNT value on done: 4247.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:31,015][63767] Sum rewards: -3.789, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.446', 'AMMO5': '0.010', 'ARMOR': '0.040', 'AMMO2': '0.042', 'weapon5': '0.100', 'AMMO3': '0.116', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'weapon4': '0.206', 'AMMO4': '0.212', 'WEAPON4': '0.450', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.106', 'weapon3': '1.284'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:31,224][63770] DAMAGECOUNT value on done: 3565.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:31,225][63770] Sum rewards: -5.436, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.449', 'AMMO4': '-0.041', 'AMMO2': '-0.008', 'AMMO3': '0.193', 'HITCOUNT': '0.210', 'WEAPON3': '0.950', 'DAMAGECOUNT': '0.975', 'weapon3': '1.392', 'weapon2': '1.592', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:31,837][63735] DAMAGECOUNT value on done: 3628.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:31,838][63735] Sum rewards: -5.076, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.840', 'AMMO4': '-0.004', 'AMMO2': '-0.001', 'AMMO5': '0.011', 'weapon4': '0.016', 'ARMOR': '0.059', 'WEAPON4': '0.150', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'weapon5': '0.150', 'AMMO3': '0.155', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.591', 'WEAPON3': '0.750', 'weapon3': '1.212', 'weapon2': '1.874'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:32,176][63735] DAMAGECOUNT value on done: 2578.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:32,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11264.0, 300 sec: 11191.1). Total num frames: 8007680. Throughput: 0: 1300.5, 1: 1490.6. Samples: 1993345. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:32,460][109198] Avg episode reward: [(0, '-3.004'), (1, '-4.679')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:32,665][63767] DAMAGECOUNT value on done: 4955.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:32,665][63767] Sum rewards: -1.507, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.065', 'AMMO2': '0.010', 'AMMO4': '0.048', 'WEAPON4': '0.050', 'ARMOR': '0.064', 'AMMO3': '0.136', 'HITCOUNT': '0.140', 'DAMAGECOUNT': '0.600', 'WEAPON3': '0.750', 'weapon2': '1.236', 'weapon3': '1.774', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:33,026][63732] Updated weights for policy 0, policy_version 960 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:33,060][63767] DAMAGECOUNT value on done: 4905.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:35,038][63733] Updated weights for policy 1, policy_version 1000 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:36,980][63806] DAMAGECOUNT value on done: 3785.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:36,981][63806] Sum rewards: -8.826, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-3.172', 'AMMO4': '-0.008', 'AMMO2': '-0.002', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'AMMO3': '0.178', 'weapon4': '0.180', 'DAMAGECOUNT': '0.270', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.266', 'weapon2': '1.478'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:37,437][63806] DAMAGECOUNT value on done: 4426.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:37,437][63806] Sum rewards: -0.857, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.350', 'AMMO2': '0.001', 'AMMO4': '0.004', 'AMMO5': '0.020', 'ARMOR': '0.040', 'AMMO3': '0.100', 'weapon5': '0.114', 'WEAPON4': '0.200', 'HITCOUNT': '0.250', 'WEAPON5': '0.300', 'weapon4': '0.464', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.098', 'weapon2': '1.166', 'weapon3': '1.636', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:37,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11264.0, 300 sec: 11177.2). Total num frames: 8060928. Throughput: 0: 1305.0, 1: 1494.1. Samples: 2010239. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:37,460][109198] Avg episode reward: [(0, '-2.943'), (1, '-4.653')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:38,410][63734] DAMAGECOUNT value on done: 4623.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:38,411][63734] Sum rewards: -2.825, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.725', 'AMMO5': '0.009', 'AMMO2': '0.021', 'ARMOR': '0.068', 'weapon5': '0.082', 'WEAPON4': '0.100', 'AMMO4': '0.107', 'AMMO3': '0.125', 'WEAPON5': '0.250', 'weapon4': '0.254', 'HITCOUNT': '0.290', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.915', 'weapon2': '1.302', 'weapon3': '1.426', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:38,855][63734] DAMAGECOUNT value on done: 3031.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:38,856][63734] Sum rewards: -3.967, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.320', 'AMMO5': '0.003', 'AMMO2': '0.011', 'WEAPON5': '0.050', 'AMMO4': '0.053', 'ARMOR': '0.060', 'weapon5': '0.064', 'WEAPON4': '0.100', 'AMMO3': '0.112', 'HITCOUNT': '0.160', 'weapon4': '0.198', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.650', 'weapon3': '1.000', 'DAMAGECOUNT': '1.104', 'weapon2': '1.538'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:39,082][63805] DAMAGECOUNT value on done: 4129.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:39,083][63805] Sum rewards: -3.305, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.150', 'AMMO5': '0.007', 'AMMO2': '0.022', 'AMMO3': '0.072', 'HITCOUNT': '0.080', 'AMMO4': '0.108', 'weapon5': '0.112', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.330', 'WEAPON4': '0.350', 'WEAPON3': '0.450', 'weapon4': '0.470', 'weapon3': '0.924', 'FRAGCOUNT': '1.000', 'weapon2': '1.220'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:39,545][63805] DAMAGECOUNT value on done: 4978.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:39,546][63805] Sum rewards: -6.231, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.452', 'weapon4': '0.012', 'AMMO2': '0.013', 'WEAPON4': '0.050', 'AMMO4': '0.067', 'ARMOR': '0.083', 'HITCOUNT': '0.170', 'AMMO3': '0.179', 'DAMAGECOUNT': '0.735', 'WEAPON3': '0.900', 'weapon3': '1.124', 'weapon2': '1.888', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:40,295][63806] DAMAGECOUNT value on done: 3814.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:40,296][63806] Sum rewards: -1.961, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.470', 'AMMO4': '-0.028', 'AMMO2': '-0.005', 'AMMO5': '0.016', 'weapon7': '0.050', 'weapon5': '0.112', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.131', 'WEAPON7': '0.200', 'HITCOUNT': '0.250', 'WEAPON5': '0.300', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.059', 'weapon2': '1.314', 'weapon3': '1.420', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:40,507][63771] DAMAGECOUNT value on done: 4250.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:40,507][63771] Sum rewards: -6.943, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.242', 'AMMO2': '0.008', 'WEAPON1': '0.010', 'AMMO5': '0.024', 'weapon4': '0.026', 'AMMO4': '0.041', 'WEAPON4': '0.100', 'weapon5': '0.158', 'AMMO3': '0.178', 'HITCOUNT': '0.180', 'WEAPON5': '0.350', 'ARMOR': '0.496', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.810', 'WEAPON3': '0.950', 'weapon2': '1.408', 'weapon3': '1.810'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:40,620][63806] DAMAGECOUNT value on done: 3149.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:40,621][63806] Sum rewards: 0.231, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.636', 'AMMO2': '0.004', 'AMMO5': '0.007', 'ARMOR': '0.012', 'AMMO4': '0.022', 'weapon5': '0.034', 'weapon7': '0.048', 'WEAPON5': '0.050', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.142', 'WEAPON4': '0.150', 'HITCOUNT': '0.190', 'WEAPON7': '0.200', 'weapon4': '0.208', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.897', 'weapon3': '1.286', 'weapon2': '1.676', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:40,935][63771] DAMAGECOUNT value on done: 2930.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:41,004][63732] Updated weights for policy 0, policy_version 970 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:41,775][63734] DAMAGECOUNT value on done: 3254.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:41,776][63734] Sum rewards: -5.147, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.384', 'AMMO5': '0.003', 'ARMOR': '0.004', 'AMMO2': '0.021', 'WEAPON5': '0.050', 'AMMO3': '0.097', 'AMMO4': '0.106', 'weapon4': '0.136', 'WEAPON4': '0.200', 'HITCOUNT': '0.270', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.080', 'weapon3': '1.218', 'weapon2': '1.702', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:42,090][63733] Updated weights for policy 1, policy_version 1010 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:42,203][63734] DAMAGECOUNT value on done: 3086.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:42,458][109198] Fps is (10 sec: 10649.6, 60 sec: 11127.5, 300 sec: 11149.5). Total num frames: 8114176. Throughput: 0: 1303.0, 1: 1486.9. Samples: 2026638. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:42,460][109198] Avg episode reward: [(0, '-2.944'), (1, '-4.735')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:42,673][63769] DAMAGECOUNT value on done: 3140.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:42,674][63769] Sum rewards: -1.812, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.676', 'AMMO2': '0.008', 'AMMO5': '0.012', 'weapon5': '0.024', 'AMMO4': '0.040', 'WEAPON4': '0.050', 'ARMOR': '0.052', 'AMMO3': '0.064', 'WEAPON5': '0.150', 'HITCOUNT': '0.240', 'weapon4': '0.326', 'WEAPON3': '0.350', 'DAMAGECOUNT': '0.765', 'FRAGCOUNT': '1.000', 'weapon3': '1.202', 'weapon2': '1.330'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:43,066][63769] DAMAGECOUNT value on done: 4512.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:43,066][63769] Sum rewards: -5.806, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-2.500', 'HEALTH': '-1.646', 'WEAPON1': '0.010', 'AMMO5': '0.018', 'AMMO2': '0.032', 'AMMO3': '0.120', 'AMMO4': '0.159', 'weapon5': '0.176', 'weapon4': '0.280', 'WEAPON4': '0.300', 'HITCOUNT': '0.310', 'WEAPON5': '0.450', 'ARMOR': '0.470', 'WEAPON3': '0.700', 'weapon2': '1.166', 'weapon3': '1.442', 'DAMAGECOUNT': '1.707'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:43,742][63769] DAMAGECOUNT value on done: 4596.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:43,743][63769] Sum rewards: -1.759, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.200', 'weapon7': '0.002', 'AMMO5': '0.008', 'ARMOR': '0.008', 'AMMO2': '0.032', 'weapon5': '0.062', 'AMMO3': '0.122', 'AMMO4': '0.162', 'WEAPON5': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.200', 'weapon4': '0.230', 'WEAPON4': '0.350', 'DAMAGECOUNT': '0.771', 'WEAPON3': '0.800', 'weapon3': '1.140', 'weapon2': '1.254', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:44,146][63769] DAMAGECOUNT value on done: 2279.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:44,147][63769] Sum rewards: -2.930, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.630', 'AMMO5': '0.005', 'AMMO2': '0.015', 'ARMOR': '0.020', 'WEAPON1': '0.020', 'AMMO4': '0.074', 'WEAPON5': '0.100', 'HITCOUNT': '0.120', 'AMMO3': '0.130', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.330', 'weapon4': '0.436', 'WEAPON3': '0.700', 'weapon2': '1.160', 'weapon3': '1.440', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:44,511][63770] DAMAGECOUNT value on done: 4396.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:44,511][63770] Sum rewards: 0.448, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.498', 'AMMO5': '0.007', 'AMMO2': '0.028', 'ARMOR': '0.040', 'AMMO3': '0.100', 'weapon5': '0.126', 'HITCOUNT': '0.140', 'AMMO4': '0.142', 'WEAPON5': '0.150', 'WEAPON4': '0.250', 'weapon4': '0.286', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.020', 'weapon3': '1.250', 'weapon2': '1.306', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:44,912][63770] DAMAGECOUNT value on done: 2874.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:47,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11195.7, 300 sec: 11163.3). Total num frames: 8171520. Throughput: 0: 1312.7, 1: 1469.1. Samples: 2034778. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:47,460][109198] Avg episode reward: [(0, '-2.842'), (1, '-4.720')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:47,467][63454] Saving new best policy, reward=-2.842!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:47,884][63732] Updated weights for policy 0, policy_version 980 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:50,406][63733] Updated weights for policy 1, policy_version 1020 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:50,895][63735] DAMAGECOUNT value on done: 4358.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:50,895][63735] Sum rewards: 0.050, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.528', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'ARMOR': '0.060', 'AMMO4': '0.092', 'AMMO3': '0.150', 'WEAPON4': '0.150', 'weapon4': '0.244', 'HITCOUNT': '0.270', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.050', 'weapon2': '1.316', 'weapon3': '1.608', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:51,238][63735] DAMAGECOUNT value on done: 4068.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:51,239][63735] Sum rewards: -3.464, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.483', 'AMMO2': '0.025', 'AMMO3': '0.066', 'AMMO4': '0.122', 'weapon4': '0.144', 'HITCOUNT': '0.180', 'WEAPON4': '0.300', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.660', 'weapon3': '1.014', 'weapon2': '1.858', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:51,417][63770] Large shaping reward -2.519 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.27, -90.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:52,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11195.7, 300 sec: 11163.3). Total num frames: 8228864. Throughput: 0: 1338.1, 1: 1442.2. Samples: 2051587. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:52,460][109198] Avg episode reward: [(0, '-2.817'), (1, '-4.675')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:52,461][63454] Saving new best policy, reward=-2.817!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:52,670][63771] DAMAGECOUNT value on done: 2660.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:52,671][63771] Sum rewards: -4.367, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.428', 'WEAPON1': '0.010', 'AMMO5': '0.013', 'AMMO2': '0.020', 'weapon5': '0.056', 'HITCOUNT': '0.070', 'ARMOR': '0.080', 'AMMO4': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.115', 'weapon4': '0.154', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.255', 'WEAPON3': '0.600', 'weapon3': '0.918', 'FRAGCOUNT': '1.000', 'weapon2': '1.570'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:53,055][63771] DAMAGECOUNT value on done: 4151.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:53,056][63771] Sum rewards: -5.226, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.367', 'weapon5': '0.008', 'WEAPON1': '0.010', 'AMMO5': '0.010', 'AMMO2': '0.012', 'weapon4': '0.048', 'ARMOR': '0.056', 'AMMO4': '0.057', 'WEAPON5': '0.100', 'AMMO3': '0.125', 'HITCOUNT': '0.130', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.426', 'weapon3': '1.684'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:53,289][63767] DAMAGECOUNT value on done: 5181.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:53,289][63767] Sum rewards: -0.346, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.994', 'AMMO5': '0.010', 'AMMO2': '0.026', 'weapon4': '0.098', 'AMMO3': '0.109', 'AMMO4': '0.130', 'WEAPON5': '0.150', 'weapon5': '0.224', 'WEAPON4': '0.250', 'HITCOUNT': '0.270', 'WEAPON3': '0.500', 'weapon3': '1.410', 'weapon2': '1.564', 'DAMAGECOUNT': '1.656', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:53,619][63767] DAMAGECOUNT value on done: 4465.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:53,777][63805] DAMAGECOUNT value on done: 5024.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:53,778][63805] Sum rewards: 0.406, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.483', 'AMMO2': '0.005', 'AMMO5': '0.017', 'ARMOR': '0.024', 'AMMO4': '0.025', 'weapon5': '0.060', 'WEAPON4': '0.150', 'AMMO3': '0.170', 'WEAPON5': '0.300', 'weapon4': '0.362', 'HITCOUNT': '0.390', 'WEAPON3': '0.950', 'weapon2': '1.294', 'DAMAGECOUNT': '1.485', 'weapon3': '1.656', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:54,109][63805] DAMAGECOUNT value on done: 3660.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:54,109][63805] Sum rewards: -2.133, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO2': '0.016', 'ARMOR': '0.040', 'AMMO4': '0.078', 'WEAPON4': '0.100', 'weapon4': '0.144', 'AMMO3': '0.150', 'HITCOUNT': '0.190', 'HEALTH': '0.272', 'DAMAGECOUNT': '0.453', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.362', 'weapon3': '1.612'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:54,408][63732] Updated weights for policy 0, policy_version 990 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:55,043][63767] DAMAGECOUNT value on done: 5315.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:55,044][63767] Sum rewards: 0.569, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.057', 'AMMO5': '0.005', 'weapon5': '0.008', 'AMMO2': '0.018', 'AMMO4': '0.091', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.135', 'HITCOUNT': '0.230', 'weapon4': '0.290', 'ARMOR': '0.504', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.080', 'weapon2': '1.240', 'weapon3': '1.374', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:55,399][63767] DAMAGECOUNT value on done: 5102.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:55,400][63767] Sum rewards: -7.395, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.819', 'AMMO2': '0.004', 'AMMO5': '0.007', 'AMMO4': '0.019', 'WEAPON1': '0.020', 'ARMOR': '0.044', 'weapon4': '0.100', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'HITCOUNT': '0.160', 'AMMO3': '0.201', 'DAMAGECOUNT': '0.591', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050', 'weapon3': '1.572', 'weapon2': '1.606'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:56,109][63770] DAMAGECOUNT value on done: 3706.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:56,110][63770] Sum rewards: 1.289, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.375', 'AMMO4': '-0.029', 'AMMO2': '-0.006', 'AMMO5': '0.005', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.112', 'AMMO3': '0.179', 'HITCOUNT': '0.450', 'ARMOR': '0.516', 'WEAPON3': '1.150', 'weapon2': '1.512', 'DAMAGECOUNT': '1.647', 'weapon3': '1.928', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:56,436][63735] DAMAGECOUNT value on done: 4082.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:56,436][63735] Sum rewards: -6.966, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-2.250', 'AMMO4': '-0.056', 'AMMO2': '-0.011', 'AMMO5': '0.015', 'weapon5': '0.158', 'AMMO3': '0.192', 'HITCOUNT': '0.280', 'WEAPON5': '0.350', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.362', 'weapon3': '1.720', 'weapon2': '1.774', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:56,497][63770] DAMAGECOUNT value on done: 3650.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:56,497][63770] Sum rewards: -5.989, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-2.000', 'HEALTH': '-1.030', 'AMMO2': '0.006', 'AMMO5': '0.007', 'AMMO4': '0.029', 'weapon5': '0.036', 'ARMOR': '0.040', 'HITCOUNT': '0.080', 'WEAPON5': '0.100', 'AMMO3': '0.115', 'DAMAGECOUNT': '0.255', 'WEAPON3': '0.750', 'weapon2': '1.386', 'weapon3': '1.736'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:56,760][63735] DAMAGECOUNT value on done: 2833.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:56,760][63735] Sum rewards: -5.781, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.990', 'AMMO5': '0.003', 'weapon5': '0.010', 'AMMO2': '0.030', 'WEAPON5': '0.050', 'ARMOR': '0.080', 'AMMO4': '0.149', 'AMMO3': '0.149', 'HITCOUNT': '0.170', 'weapon4': '0.204', 'WEAPON4': '0.350', 'DAMAGECOUNT': '0.765', 'WEAPON3': '0.850', 'weapon3': '1.096', 'weapon2': '1.554', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:57,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11195.7, 300 sec: 11149.4). Total num frames: 8282112. Throughput: 0: 1366.2, 1: 1413.0. Samples: 2068264. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:48:57,460][109198] Avg episode reward: [(0, '-2.844'), (1, '-4.705')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:48:58,613][63733] Updated weights for policy 1, policy_version 1030 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:00,921][63732] Updated weights for policy 0, policy_version 1000 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:01,569][63806] DAMAGECOUNT value on done: 3879.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:01,570][63806] Sum rewards: -10.279, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-2.245', 'AMMO2': '0.002', 'AMMO5': '0.009', 'AMMO4': '0.011', 'WEAPON1': '0.020', 'HITCOUNT': '0.080', 'AMMO3': '0.143', 'weapon5': '0.146', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.282', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.220', 'weapon2': '1.602'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:01,960][63806] DAMAGECOUNT value on done: 5001.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:01,960][63806] Sum rewards: -1.918, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.400', 'AMMO5': '0.012', 'AMMO2': '0.033', 'ARMOR': '0.068', 'weapon5': '0.072', 'weapon4': '0.146', 'WEAPON5': '0.150', 'AMMO4': '0.166', 'AMMO3': '0.173', 'WEAPON4': '0.250', 'HITCOUNT': '0.420', 'WEAPON3': '0.700', 'weapon3': '1.448', 'DAMAGECOUNT': '1.725', 'weapon2': '1.868', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:02,459][109198] Fps is (10 sec: 11058.9, 60 sec: 11195.7, 300 sec: 11149.4). Total num frames: 8339456. Throughput: 0: 1391.8, 1: 1385.6. Samples: 2076634. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:02,460][109198] Avg episode reward: [(0, '-2.849'), (1, '-4.733')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:03,138][63806] DAMAGECOUNT value on done: 3988.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:03,138][63806] Sum rewards: -2.667, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.708', 'AMMO2': '0.003', 'AMMO5': '0.007', 'ARMOR': '0.016', 'AMMO4': '0.016', 'WEAPON4': '0.050', 'weapon4': '0.056', 'weapon5': '0.060', 'AMMO3': '0.150', 'HITCOUNT': '0.170', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.522', 'WEAPON3': '0.900', 'weapon3': '1.520', 'weapon2': '1.620', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:03,530][63806] DAMAGECOUNT value on done: 3540.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:03,531][63806] Sum rewards: -9.551, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-3.276', 'AMMO5': '0.014', 'AMMO2': '0.022', 'weapon4': '0.032', 'AMMO4': '0.109', 'weapon5': '0.144', 'WEAPON4': '0.250', 'AMMO3': '0.251', 'HITCOUNT': '0.340', 'WEAPON5': '0.350', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '1.173', 'WEAPON3': '1.300', 'weapon2': '1.492', 'weapon3': '1.998'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:03,553][63734] DAMAGECOUNT value on done: 5161.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:03,553][63734] Sum rewards: 1.057, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.424', 'AMMO2': '0.011', 'AMMO5': '0.034', 'AMMO4': '0.057', 'weapon4': '0.080', 'AMMO3': '0.136', 'WEAPON4': '0.150', 'weapon5': '0.300', 'HITCOUNT': '0.360', 'WEAPON5': '0.500', 'WEAPON3': '0.900', 'weapon2': '1.238', 'DAMAGECOUNT': '1.614', 'weapon3': '1.850', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:03,941][63734] DAMAGECOUNT value on done: 3101.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:04,063][63805] DAMAGECOUNT value on done: 4789.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:04,063][63805] Sum rewards: 0.433, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.590', 'AMMO5': '0.007', 'AMMO2': '0.023', 'ARMOR': '0.024', 'weapon5': '0.108', 'AMMO4': '0.114', 'weapon4': '0.188', 'AMMO3': '0.192', 'WEAPON5': '0.250', 'WEAPON4': '0.300', 'HITCOUNT': '0.350', 'weapon2': '0.716', 'WEAPON3': '1.050', 'DAMAGECOUNT': '1.980', 'weapon3': '2.220', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:04,533][63805] DAMAGECOUNT value on done: 5018.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:05,251][63734] DAMAGECOUNT value on done: 3460.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:05,251][63734] Sum rewards: -10.016, reward structure: {'DEATHCOUNT': '-12.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.250', 'AMMO5': '0.010', 'AMMO2': '0.023', 'ARMOR': '0.044', 'HITCOUNT': '0.080', 'weapon4': '0.098', 'AMMO4': '0.115', 'AMMO3': '0.151', 'weapon5': '0.170', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.618', 'WEAPON3': '0.800', 'weapon3': '1.322', 'weapon2': '1.652'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:05,435][63771] DAMAGECOUNT value on done: 4874.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:05,435][63771] Sum rewards: 1.355, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.758', 'AMMO2': '0.005', 'AMMO5': '0.015', 'AMMO4': '0.026', 'WEAPON4': '0.050', 'weapon4': '0.104', 'AMMO3': '0.162', 'weapon5': '0.192', 'WEAPON5': '0.200', 'HITCOUNT': '0.300', 'ARMOR': '0.454', 'WEAPON3': '0.850', 'weapon2': '1.596', 'weapon3': '1.786', 'DAMAGECOUNT': '1.872', 'FRAGCOUNT': '3.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:05,628][63734] DAMAGECOUNT value on done: 3260.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:05,628][63734] Sum rewards: -2.303, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.415', 'AMMO2': '0.003', 'AMMO4': '0.016', 'weapon7': '0.078', 'AMMO3': '0.101', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.150', 'HITCOUNT': '0.160', 'weapon4': '0.188', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.522', 'WEAPON3': '0.550', 'weapon3': '0.960', 'FRAGCOUNT': '1.000', 'weapon2': '1.694'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:05,872][63771] DAMAGECOUNT value on done: 3075.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:05,872][63771] Sum rewards: -2.566, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.676', 'AMMO2': '0.003', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO4': '0.013', 'weapon5': '0.034', 'AMMO3': '0.089', 'HITCOUNT': '0.130', 'WEAPON5': '0.150', 'ARMOR': '0.424', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.600', 'weapon3': '1.294', 'weapon2': '1.420', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:07,011][63733] Updated weights for policy 1, policy_version 1040 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:07,332][63769] DAMAGECOUNT value on done: 5031.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:07,333][63769] Sum rewards: -2.924, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.585', 'AMMO2': '0.013', 'AMMO4': '0.064', 'AMMO3': '0.180', 'WEAPON4': '0.200', 'weapon4': '0.266', 'HITCOUNT': '0.290', 'ARMOR': '0.483', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.305', 'weapon2': '1.630', 'weapon3': '1.630', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:07,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11127.5, 300 sec: 11135.6). Total num frames: 8392704. Throughput: 0: 1438.7, 1: 1340.0. Samples: 2093233. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:07,460][109198] Avg episode reward: [(0, '-2.753'), (1, '-4.718')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:07,467][63454] Saving new best policy, reward=-2.753!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:07,615][63732] Updated weights for policy 0, policy_version 1010 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:07,724][63769] DAMAGECOUNT value on done: 2590.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:07,725][63769] Sum rewards: -0.638, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.955', 'AMMO2': '0.021', 'AMMO3': '0.087', 'AMMO4': '0.106', 'ARMOR': '0.108', 'WEAPON4': '0.200', 'HITCOUNT': '0.260', 'weapon4': '0.316', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.933', 'FRAGCOUNT': '1.000', 'weapon3': '1.270', 'weapon2': '2.216'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:07,983][63769] DAMAGECOUNT value on done: 3389.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:07,983][63769] Sum rewards: -6.365, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-0.802', 'AMMO2': '0.001', 'AMMO4': '0.005', 'AMMO5': '0.010', 'weapon5': '0.010', 'ARMOR': '0.036', 'WEAPON5': '0.100', 'HITCOUNT': '0.180', 'AMMO3': '0.204', 'DAMAGECOUNT': '0.747', 'WEAPON3': '0.800', 'weapon3': '1.360', 'weapon2': '1.734', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:08,388][63769] DAMAGECOUNT value on done: 4774.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:08,388][63769] Sum rewards: -2.783, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.640', 'AMMO5': '0.007', 'ARMOR': '0.016', 'AMMO2': '0.029', 'weapon5': '0.050', 'AMMO3': '0.081', 'AMMO4': '0.143', 'HITCOUNT': '0.200', 'WEAPON5': '0.200', 'WEAPON4': '0.400', 'weapon4': '0.490', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.786', 'FRAGCOUNT': '1.000', 'weapon2': '1.060', 'weapon3': '1.544'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:09,809][63770] DAMAGECOUNT value on done: 5328.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:09,809][63770] Sum rewards: 3.174, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.176', 'AMMO5': '0.018', 'AMMO2': '0.028', 'ARMOR': '0.040', 'weapon4': '0.134', 'AMMO4': '0.141', 'AMMO3': '0.167', 'weapon5': '0.236', 'WEAPON4': '0.250', 'HITCOUNT': '0.270', 'WEAPON5': '0.400', 'WEAPON3': '0.900', 'weapon2': '1.584', 'weapon3': '1.636', 'DAMAGECOUNT': '2.796', 'FRAGCOUNT': '5.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:10,200][63770] DAMAGECOUNT value on done: 3044.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:10,201][63770] Sum rewards: -4.628, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.422', 'weapon4': '0.006', 'AMMO2': '0.011', 'WEAPON1': '0.030', 'AMMO4': '0.056', 'ARMOR': '0.092', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.118', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.056', 'weapon2': '2.004'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:12,458][109198] Fps is (10 sec: 11059.4, 60 sec: 11127.5, 300 sec: 11121.7). Total num frames: 8450048. Throughput: 0: 1470.9, 1: 1304.6. Samples: 2109947. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:12,460][109198] Avg episode reward: [(0, '-2.670'), (1, '-4.712')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:12,461][63454] Saving new best policy, reward=-2.670!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:14,021][63732] Updated weights for policy 0, policy_version 1020 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:15,097][63771] DAMAGECOUNT value on done: 2745.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:15,097][63771] Sum rewards: -5.797, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.358', 'AMMO4': '-0.012', 'AMMO2': '-0.002', 'AMMO5': '0.005', 'ARMOR': '0.051', 'HITCOUNT': '0.090', 'WEAPON5': '0.100', 'AMMO3': '0.174', 'DAMAGECOUNT': '0.255', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon3': '1.412', 'weapon2': '1.638'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:15,449][63733] Updated weights for policy 1, policy_version 1050 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:15,479][63771] DAMAGECOUNT value on done: 4421.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:15,480][63771] Sum rewards: -2.299, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.760', 'AMMO4': '-0.003', 'AMMO2': '-0.001', 'AMMO5': '0.007', 'weapon5': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'WEAPON5': '0.050', 'weapon4': '0.064', 'AMMO3': '0.139', 'HITCOUNT': '0.200', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.810', 'weapon3': '1.508', 'weapon2': '1.762', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:15,603][63735] DAMAGECOUNT value on done: 4623.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:15,604][63735] Sum rewards: -4.235, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.646', 'AMMO2': '0.002', 'AMMO4': '0.008', 'weapon4': '0.038', 'WEAPON4': '0.050', 'AMMO3': '0.122', 'HITCOUNT': '0.150', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.795', 'FRAGCOUNT': '1.000', 'weapon3': '1.638', 'weapon2': '1.708'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:15,952][63735] DAMAGECOUNT value on done: 4408.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:15,952][63735] Sum rewards: -1.962, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.489', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO2': '0.027', 'ARMOR': '0.068', 'weapon5': '0.120', 'AMMO4': '0.134', 'AMMO3': '0.148', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'HITCOUNT': '0.280', 'weapon4': '0.322', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.020', 'weapon3': '1.224', 'weapon2': '1.802', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:16,199][63767] DAMAGECOUNT value on done: 5741.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:16,199][63767] Sum rewards: -4.756, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.157', 'AMMO2': '0.009', 'weapon4': '0.012', 'AMMO5': '0.013', 'WEAPON1': '0.030', 'AMMO4': '0.046', 'WEAPON4': '0.050', 'AMMO3': '0.170', 'weapon5': '0.174', 'WEAPON5': '0.350', 'HITCOUNT': '0.470', 'WEAPON3': '0.750', 'weapon3': '1.578', 'DAMAGECOUNT': '1.680', 'weapon2': '1.818', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:16,529][63767] DAMAGECOUNT value on done: 5167.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:16,529][63767] Sum rewards: -0.763, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.336', 'AMMO5': '0.007', 'AMMO2': '0.029', 'weapon5': '0.056', 'ARMOR': '0.064', 'AMMO4': '0.143', 'WEAPON5': '0.150', 'AMMO3': '0.162', 'WEAPON4': '0.200', 'HITCOUNT': '0.440', 'weapon2': '0.534', 'weapon4': '0.566', 'WEAPON3': '1.050', 'DAMAGECOUNT': '2.106', 'weapon3': '2.316', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:17,212][63767] DAMAGECOUNT value on done: 5375.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:17,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11127.5, 300 sec: 11121.7). Total num frames: 8507392. Throughput: 0: 1488.5, 1: 1287.8. Samples: 2118278. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:17,460][109198] Avg episode reward: [(0, '-2.674'), (1, '-4.693')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:17,536][63767] DAMAGECOUNT value on done: 5455.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:17,537][63767] Sum rewards: -5.246, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.701', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'weapon5': '0.048', 'WEAPON4': '0.050', 'AMMO4': '0.054', 'weapon4': '0.082', 'WEAPON5': '0.100', 'AMMO3': '0.162', 'HITCOUNT': '0.260', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.950', 'weapon2': '1.054', 'DAMAGECOUNT': '1.059', 'weapon3': '1.860'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:18,754][63805] DAMAGECOUNT value on done: 5344.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:18,754][63805] Sum rewards: 1.434, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.294', 'AMMO2': '0.013', 'AMMO5': '0.021', 'AMMO3': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.064', 'weapon4': '0.078', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'HITCOUNT': '0.150', 'weapon7': '0.194', 'weapon5': '0.228', 'WEAPON3': '0.350', 'WEAPON5': '0.400', 'ARMOR': '0.436', 'weapon3': '0.928', 'DAMAGECOUNT': '0.960', 'weapon2': '1.506', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:19,149][63805] DAMAGECOUNT value on done: 3830.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:19,149][63805] Sum rewards: -6.516, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.320', 'AMMO2': '0.008', 'AMMO5': '0.010', 'ARMOR': '0.040', 'AMMO4': '0.041', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.169', 'WEAPON4': '0.200', 'weapon4': '0.410', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon3': '1.262', 'weapon2': '1.344'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:20,637][63732] Updated weights for policy 0, policy_version 1030 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:21,176][63735] DAMAGECOUNT value on done: 4470.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:21,176][63735] Sum rewards: -5.209, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.752', 'AMMO5': '0.008', 'AMMO2': '0.009', 'AMMO4': '0.046', 'WEAPON4': '0.050', 'weapon4': '0.068', 'weapon5': '0.096', 'WEAPON5': '0.100', 'AMMO3': '0.220', 'HITCOUNT': '0.220', 'WEAPON3': '1.050', 'DAMAGECOUNT': '1.164', 'weapon3': '1.482', 'FRAGCOUNT': '2.000', 'weapon2': '2.030'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:21,385][63770] DAMAGECOUNT value on done: 3846.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:21,386][63770] Sum rewards: -5.353, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.126', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'weapon4': '0.012', 'AMMO4': '0.017', 'ARMOR': '0.076', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.116', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.184', 'weapon2': '1.974'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:21,570][63735] DAMAGECOUNT value on done: 2963.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:21,571][63735] Sum rewards: -7.044, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.792', 'AMMO5': '0.005', 'AMMO2': '0.007', 'AMMO4': '0.034', 'HITCOUNT': '0.100', 'AMMO3': '0.158', 'DAMAGECOUNT': '0.390', 'ARMOR': '0.404', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.546', 'weapon3': '1.554'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:21,737][63770] DAMAGECOUNT value on done: 3851.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:21,737][63770] Sum rewards: 1.401, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.911', 'AMMO2': '0.001', 'AMMO4': '0.004', 'AMMO3': '0.060', 'weapon7': '0.090', 'HITCOUNT': '0.100', 'ARMOR': '0.104', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON7': '0.200', 'WEAPON4': '0.250', 'WEAPON3': '0.500', 'weapon4': '0.550', 'DAMAGECOUNT': '0.603', 'weapon3': '1.298', 'weapon2': '1.562', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:22,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11127.4, 300 sec: 11107.8). Total num frames: 8560640. Throughput: 0: 1521.0, 1: 1249.3. Samples: 2134903. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:22,461][109198] Avg episode reward: [(0, '-2.607'), (1, '-4.768')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:22,501][63454] Saving new best policy, reward=-2.607!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:23,856][63733] Updated weights for policy 1, policy_version 1060 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:26,051][63806] DAMAGECOUNT value on done: 3954.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:26,051][63806] Sum rewards: -1.770, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.358', 'AMMO2': '0.015', 'ARMOR': '0.064', 'AMMO4': '0.076', 'HITCOUNT': '0.080', 'AMMO3': '0.092', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.225', 'weapon4': '0.328', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.136', 'weapon3': '1.622'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:26,183][63806] DAMAGECOUNT value on done: 4233.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:26,184][63806] Sum rewards: 0.336, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.542', 'AMMO2': '0.003', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.015', 'weapon7': '0.044', 'WEAPON4': '0.050', 'ARMOR': '0.056', 'weapon5': '0.108', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.140', 'AMMO3': '0.144', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'weapon4': '0.214', 'DAMAGECOUNT': '0.735', 'WEAPON3': '0.800', 'weapon2': '1.522', 'weapon3': '1.634', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:26,425][63806] DAMAGECOUNT value on done: 5585.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:26,425][63806] Sum rewards: 2.030, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.458', 'AMMO2': '0.005', 'AMMO5': '0.016', 'AMMO4': '0.026', 'weapon5': '0.154', 'AMMO3': '0.208', 'WEAPON5': '0.250', 'ARMOR': '0.483', 'HITCOUNT': '0.490', 'WEAPON3': '1.000', 'weapon2': '1.114', 'DAMAGECOUNT': '1.752', 'weapon3': '2.490', 'FRAGCOUNT': '6.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:26,559][63806] DAMAGECOUNT value on done: 4115.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:26,559][63806] Sum rewards: 2.494, reward structure: {'DEATHCOUNT': '-9.000', 'WEAPON1': '0.010', 'AMMO5': '0.019', 'AMMO2': '0.024', 'ARMOR': '0.064', 'AMMO4': '0.118', 'AMMO3': '0.122', 'WEAPON4': '0.150', 'HEALTH': '0.164', 'weapon4': '0.228', 'WEAPON5': '0.250', 'weapon5': '0.252', 'HITCOUNT': '0.320', 'WEAPON3': '0.650', 'weapon2': '1.172', 'DAMAGECOUNT': '1.725', 'weapon3': '1.726', 'FRAGCOUNT': '4.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:27,082][63732] Updated weights for policy 0, policy_version 1040 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:27,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11127.5, 300 sec: 11135.6). Total num frames: 8617984. Throughput: 0: 1560.6, 1: 1221.7. Samples: 2151843. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:27,460][109198] Avg episode reward: [(0, '-2.497'), (1, '-4.741')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:27,465][63454] Saving new best policy, reward=-2.497!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:28,528][63734] DAMAGECOUNT value on done: 5251.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:28,821][63734] DAMAGECOUNT value on done: 3973.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:28,821][63734] Sum rewards: -2.103, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.706', 'AMMO2': '0.003', 'AMMO5': '0.011', 'AMMO4': '0.017', 'weapon5': '0.098', 'WEAPON4': '0.100', 'AMMO3': '0.175', 'WEAPON5': '0.250', 'weapon4': '0.254', 'HITCOUNT': '0.390', 'WEAPON3': '0.850', 'ARMOR': '0.915', 'weapon2': '1.470', 'FRAGCOUNT': '1.500', 'DAMAGECOUNT': '1.539', 'weapon3': '1.780'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:28,923][63734] DAMAGECOUNT value on done: 3294.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:28,924][63734] Sum rewards: -4.464, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.608', 'AMMO5': '0.005', 'AMMO2': '0.012', 'AMMO4': '0.059', 'weapon4': '0.062', 'WEAPON4': '0.100', 'AMMO3': '0.127', 'HITCOUNT': '0.240', 'ARMOR': '0.428', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.579', 'weapon3': '1.448', 'FRAGCOUNT': '2.000', 'weapon2': '2.084'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:29,000][63805] DAMAGECOUNT value on done: 4976.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:29,000][63805] Sum rewards: -7.480, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-0.869', 'AMMO5': '0.005', 'AMMO2': '0.028', 'ARMOR': '0.056', 'WEAPON5': '0.100', 'AMMO4': '0.141', 'HITCOUNT': '0.160', 'AMMO3': '0.194', 'WEAPON4': '0.200', 'weapon4': '0.260', 'DAMAGECOUNT': '0.561', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon3': '1.512', 'weapon2': '1.722'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:29,226][63734] DAMAGECOUNT value on done: 3370.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:29,226][63734] Sum rewards: 0.695, reward structure: {'DEATHCOUNT': '-5.250', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'ARMOR': '0.064', 'weapon4': '0.072', 'AMMO4': '0.082', 'AMMO3': '0.084', 'WEAPON4': '0.100', 'weapon5': '0.110', 'HITCOUNT': '0.120', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.330', 'HEALTH': '0.358', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.442', 'weapon2': '1.448'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:29,411][63805] DAMAGECOUNT value on done: 5208.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:29,411][63805] Sum rewards: -2.148, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.940', 'AMMO2': '0.001', 'AMMO4': '0.004', 'AMMO5': '0.005', 'weapon5': '0.022', 'ARMOR': '0.032', 'AMMO3': '0.098', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.570', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.466', 'weapon2': '1.544'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:30,299][63771] DAMAGECOUNT value on done: 4988.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:30,299][63771] Sum rewards: -1.669, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.184', 'AMMO2': '0.014', 'AMMO5': '0.015', 'ARMOR': '0.048', 'AMMO4': '0.068', 'AMMO3': '0.088', 'weapon5': '0.092', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.130', 'weapon7': '0.154', 'WEAPON7': '0.200', 'WEAPON4': '0.250', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.342', 'WEAPON3': '0.500', 'weapon4': '0.508', 'FRAGCOUNT': '1.000', 'weapon3': '1.002', 'weapon2': '1.314'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:30,734][63771] DAMAGECOUNT value on done: 3262.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:30,735][63771] Sum rewards: -7.991, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.028', 'AMMO2': '0.011', 'AMMO5': '0.011', 'ARMOR': '0.020', 'AMMO4': '0.055', 'weapon5': '0.080', 'AMMO3': '0.160', 'HITCOUNT': '0.160', 'WEAPON5': '0.250', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.561', 'WEAPON3': '0.800', 'weapon2': '1.200', 'weapon3': '1.978'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:30,974][63769] DAMAGECOUNT value on done: 5140.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:30,975][63769] Sum rewards: -4.106, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.000', 'AMMO2': '0.009', 'AMMO5': '0.015', 'AMMO4': '0.043', 'weapon5': '0.098', 'AMMO3': '0.119', 'HITCOUNT': '0.130', 'WEAPON4': '0.150', 'WEAPON5': '0.250', 'weapon4': '0.306', 'DAMAGECOUNT': '0.327', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.224', 'weapon3': '1.622'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:31,392][63769] DAMAGECOUNT value on done: 2795.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:31,392][63769] Sum rewards: -8.741, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-1.950', 'AMMO5': '0.009', 'AMMO2': '0.010', 'weapon5': '0.030', 'AMMO4': '0.049', 'ARMOR': '0.068', 'WEAPON5': '0.100', 'WEAPON4': '0.150', 'AMMO3': '0.153', 'weapon4': '0.168', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.615', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.170', 'weapon3': '2.016'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:32,311][63733] Updated weights for policy 1, policy_version 1070 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:32,458][109198] Fps is (10 sec: 11469.0, 60 sec: 11127.5, 300 sec: 11177.2). Total num frames: 8675328. Throughput: 0: 1564.6, 1: 1221.1. Samples: 2160133. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:32,460][109198] Avg episode reward: [(0, '-2.468'), (1, '-4.724')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:32,461][63454] Saving new best policy, reward=-2.468!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:33,091][63769] DAMAGECOUNT value on done: 3643.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:33,091][63769] Sum rewards: -2.413, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.300', 'AMMO5': '0.017', 'AMMO2': '0.029', 'weapon5': '0.072', 'AMMO3': '0.122', 'HITCOUNT': '0.140', 'AMMO4': '0.145', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'weapon4': '0.316', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.762', 'weapon2': '1.398', 'weapon3': '1.736', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:33,427][63769] DAMAGECOUNT value on done: 5089.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:33,427][63769] Sum rewards: -6.785, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.916', 'AMMO2': '0.006', 'WEAPON1': '0.010', 'AMMO5': '0.018', 'AMMO4': '0.029', 'weapon5': '0.038', 'ARMOR': '0.069', 'AMMO3': '0.158', 'WEAPON4': '0.200', 'weapon4': '0.206', 'HITCOUNT': '0.240', 'WEAPON5': '0.350', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.945', 'WEAPON3': '1.000', 'weapon2': '1.310', 'weapon3': '1.552'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:33,658][63732] Updated weights for policy 0, policy_version 1050 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:35,053][63770] DAMAGECOUNT value on done: 5725.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:35,054][63770] Sum rewards: 1.545, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.931', 'AMMO4': '-0.053', 'AMMO2': '-0.011', 'AMMO5': '0.014', 'weapon7': '0.064', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.141', 'HITCOUNT': '0.160', 'weapon5': '0.182', 'weapon4': '0.192', 'WEAPON5': '0.300', 'ARMOR': '0.467', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.191', 'weapon2': '1.274', 'weapon3': '1.704', 'FRAGCOUNT': '3.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:35,402][63770] DAMAGECOUNT value on done: 3149.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:35,402][63770] Sum rewards: -3.171, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.635', 'AMMO5': '0.003', 'AMMO2': '0.003', 'weapon5': '0.010', 'AMMO4': '0.016', 'WEAPON5': '0.050', 'HITCOUNT': '0.100', 'AMMO3': '0.137', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.850', 'weapon2': '1.308', 'weapon3': '1.922', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:37,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11127.5, 300 sec: 11177.2). Total num frames: 8728576. Throughput: 0: 1564.8, 1: 1219.7. Samples: 2176890. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:37,460][109198] Avg episode reward: [(0, '-2.475'), (1, '-4.758')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:37,854][63771] DAMAGECOUNT value on done: 2790.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:38,252][63771] DAMAGECOUNT value on done: 4707.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:38,252][63771] Sum rewards: -5.998, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-3.300', 'AMMO4': '-0.029', 'AMMO2': '-0.006', 'AMMO5': '0.005', 'weapon5': '0.008', 'ARMOR': '0.028', 'WEAPON5': '0.100', 'HITCOUNT': '0.180', 'AMMO3': '0.186', 'DAMAGECOUNT': '0.858', 'WEAPON3': '1.050', 'weapon2': '1.470', 'weapon3': '1.702', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:39,296][63767] DAMAGECOUNT value on done: 6180.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:39,297][63767] Sum rewards: 4.534, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-0.495', 'AMMO2': '0.001', 'AMMO4': '0.006', 'AMMO5': '0.007', 'ARMOR': '0.032', 'weapon5': '0.048', 'WEAPON5': '0.100', 'AMMO3': '0.103', 'HITCOUNT': '0.280', 'WEAPON3': '0.350', 'weapon2': '1.168', 'DAMAGECOUNT': '1.317', 'weapon3': '1.616', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:39,474][63767] DAMAGECOUNT value on done: 5634.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:39,474][63767] Sum rewards: -9.964, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.890', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.013', 'AMMO2': '-0.003', 'AMMO5': '0.005', 'weapon5': '0.016', 'WEAPON5': '0.050', 'ARMOR': '0.056', 'AMMO3': '0.170', 'HITCOUNT': '0.240', 'DAMAGECOUNT': '0.777', 'WEAPON3': '1.000', 'weapon2': '1.506', 'weapon3': '1.622'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:39,689][63767] DAMAGECOUNT value on done: 5454.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:39,690][63767] Sum rewards: -4.481, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.140', 'WEAPON1': '0.010', 'AMMO5': '0.017', 'AMMO2': '0.017', 'ARMOR': '0.028', 'AMMO4': '0.085', 'WEAPON4': '0.100', 'AMMO3': '0.163', 'weapon5': '0.174', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'weapon4': '0.474', 'DAMAGECOUNT': '0.861', 'WEAPON3': '0.900', 'weapon2': '0.938', 'FRAGCOUNT': '1.000', 'weapon3': '1.922'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:39,872][63767] DAMAGECOUNT value on done: 5843.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:39,872][63767] Sum rewards: 2.237, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.038', 'AMMO4': '-0.016', 'AMMO2': '-0.003', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'weapon4': '0.102', 'AMMO3': '0.138', 'HITCOUNT': '0.370', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.164', 'weapon2': '1.284', 'weapon3': '1.654', 'FRAGCOUNT': '6.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:40,238][63732] Updated weights for policy 0, policy_version 1060 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:40,329][63735] DAMAGECOUNT value on done: 4668.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:40,330][63735] Sum rewards: -2.262, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.149', 'AMMO5': '0.003', 'weapon5': '0.016', 'AMMO2': '0.019', 'ARMOR': '0.036', 'WEAPON5': '0.050', 'HITCOUNT': '0.060', 'AMMO4': '0.092', 'AMMO3': '0.104', 'DAMAGECOUNT': '0.135', 'WEAPON4': '0.150', 'weapon4': '0.240', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.306', 'weapon3': '1.576'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:40,697][63733] Updated weights for policy 1, policy_version 1080 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:40,706][63735] DAMAGECOUNT value on done: 4518.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:40,707][63735] Sum rewards: -7.782, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.262', 'FRAGCOUNT': '-1.500', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'AMMO5': '0.007', 'weapon5': '0.072', 'ARMOR': '0.099', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'AMMO3': '0.196', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.330', 'weapon4': '0.432', 'WEAPON3': '0.950', 'weapon3': '1.336', 'weapon2': '1.816'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:42,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11195.7, 300 sec: 11163.3). Total num frames: 8785920. Throughput: 0: 1562.0, 1: 1214.8. Samples: 2193220. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:42,460][109198] Avg episode reward: [(0, '-2.470'), (1, '-4.808')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:43,674][63805] DAMAGECOUNT value on done: 6019.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:43,674][63805] Sum rewards: -2.050, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.682', 'AMMO5': '0.007', 'AMMO2': '0.017', 'ARMOR': '0.072', 'AMMO4': '0.083', 'WEAPON5': '0.100', 'AMMO3': '0.173', 'HITCOUNT': '0.430', 'WEAPON3': '0.900', 'weapon3': '1.858', 'weapon2': '1.966', 'DAMAGECOUNT': '2.025', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:44,020][63805] DAMAGECOUNT value on done: 4020.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:44,021][63805] Sum rewards: -3.266, reward structure: {'DEATHCOUNT': '-9.000', 'AMMO2': '0.017', 'WEAPON4': '0.050', 'weapon4': '0.080', 'AMMO4': '0.083', 'HEALTH': '0.101', 'ARMOR': '0.106', 'HITCOUNT': '0.130', 'AMMO3': '0.151', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.570', 'FRAGCOUNT': '1.000', 'weapon3': '1.212', 'weapon2': '1.734'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:45,928][63735] DAMAGECOUNT value on done: 4685.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:45,928][63735] Sum rewards: -7.719, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.922', 'AMMO5': '0.003', 'AMMO2': '0.007', 'weapon5': '0.014', 'AMMO4': '0.034', 'WEAPON5': '0.050', 'ARMOR': '0.056', 'AMMO3': '0.193', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.645', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.100', 'weapon2': '1.820', 'weapon3': '1.822'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:46,334][63735] DAMAGECOUNT value on done: 2978.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:46,641][63770] DAMAGECOUNT value on done: 4101.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:46,641][63770] Sum rewards: -5.735, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.420', 'AMMO4': '-0.039', 'AMMO2': '-0.008', 'AMMO5': '0.007', 'weapon5': '0.038', 'WEAPON5': '0.150', 'AMMO3': '0.157', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.765', 'WEAPON3': '0.900', 'weapon2': '1.446', 'weapon3': '1.558', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:46,861][63732] Updated weights for policy 0, policy_version 1070 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:47,096][63770] DAMAGECOUNT value on done: 3959.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:47,097][63770] Sum rewards: 0.577, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.423', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.020', 'AMMO4': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.119', 'weapon5': '0.120', 'HITCOUNT': '0.130', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.324', 'weapon4': '0.426', 'ARMOR': '0.480', 'WEAPON3': '0.750', 'weapon2': '1.190', 'weapon3': '1.826', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:47,458][109198] Fps is (10 sec: 10649.7, 60 sec: 11059.2, 300 sec: 11149.5). Total num frames: 8835072. Throughput: 0: 1558.2, 1: 1213.9. Samples: 2201378. Policy #0 lag: (min: 0.0, avg: 0.3, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:47,460][109198] Avg episode reward: [(0, '-2.434'), (1, '-4.828')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:47,466][63454] Saving new best policy, reward=-2.434!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:49,230][63733] Updated weights for policy 1, policy_version 1090 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:49,392][63806] DAMAGECOUNT value on done: 4533.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:49,393][63806] Sum rewards: -5.620, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.504', 'AMMO5': '0.005', 'AMMO2': '0.008', 'AMMO4': '0.040', 'ARMOR': '0.046', 'WEAPON5': '0.100', 'AMMO3': '0.174', 'WEAPON4': '0.200', 'HITCOUNT': '0.290', 'weapon4': '0.482', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.330', 'weapon3': '1.658'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:49,750][63806] DAMAGECOUNT value on done: 4385.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:49,750][63806] Sum rewards: -1.281, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.800', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'AMMO5': '0.005', 'weapon4': '0.040', 'ARMOR': '0.052', 'weapon5': '0.054', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.151', 'HITCOUNT': '0.230', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.810', 'weapon2': '1.622', 'weapon3': '1.816', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:50,569][63806] DAMAGECOUNT value on done: 3991.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:50,570][63806] Sum rewards: -10.948, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.804', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.010', 'AMMO2': '0.021', 'weapon5': '0.034', 'HITCOUNT': '0.040', 'WEAPON5': '0.100', 'AMMO4': '0.103', 'DAMAGECOUNT': '0.111', 'weapon4': '0.134', 'AMMO3': '0.163', 'WEAPON4': '0.200', 'ARMOR': '0.464', 'WEAPON3': '0.950', 'weapon3': '1.352', 'weapon2': '1.424'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:50,943][63806] DAMAGECOUNT value on done: 5915.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:50,943][63806] Sum rewards: -1.128, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.274', 'AMMO5': '0.003', 'AMMO2': '0.015', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'weapon5': '0.054', 'weapon7': '0.068', 'AMMO4': '0.073', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.131', 'WEAPON7': '0.200', 'weapon4': '0.214', 'HITCOUNT': '0.310', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.990', 'FRAGCOUNT': '1.000', 'weapon3': '1.360', 'weapon2': '1.988'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:52,458][109198] Fps is (10 sec: 10649.5, 60 sec: 11059.2, 300 sec: 11149.5). Total num frames: 8892416. Throughput: 0: 1558.8, 1: 1214.5. Samples: 2218034. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:52,460][109198] Avg episode reward: [(0, '-2.471'), (1, '-4.901')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:52,730][63734] DAMAGECOUNT value on done: 4345.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:52,731][63734] Sum rewards: -1.936, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.452', 'AMMO5': '0.009', 'AMMO2': '0.011', 'ARMOR': '0.024', 'weapon7': '0.050', 'AMMO4': '0.054', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon5': '0.132', 'AMMO3': '0.142', 'HITCOUNT': '0.160', 'WEAPON7': '0.200', 'WEAPON5': '0.250', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.116', 'weapon3': '1.534', 'weapon2': '1.894'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:53,115][63734] DAMAGECOUNT value on done: 3602.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:53,116][63734] Sum rewards: -3.988, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.469', 'AMMO5': '0.012', 'AMMO2': '0.036', 'ARMOR': '0.072', 'weapon5': '0.082', 'WEAPON4': '0.150', 'AMMO3': '0.158', 'weapon4': '0.172', 'AMMO4': '0.179', 'WEAPON5': '0.200', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.696', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.500', 'weapon2': '1.672', 'weapon3': '1.792'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:53,451][63732] Updated weights for policy 0, policy_version 1080 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:53,829][63734] DAMAGECOUNT value on done: 5501.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:53,829][63734] Sum rewards: -1.849, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.790', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.014', 'weapon4': '0.034', 'WEAPON5': '0.050', 'AMMO4': '0.068', 'AMMO3': '0.088', 'WEAPON4': '0.150', 'HITCOUNT': '0.240', 'ARMOR': '0.400', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.472', 'weapon3': '1.612'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:53,929][63805] DAMAGECOUNT value on done: 5314.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:53,929][63805] Sum rewards: -0.089, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.352', 'AMMO2': '0.001', 'AMMO4': '0.007', 'AMMO5': '0.010', 'ARMOR': '0.064', 'weapon5': '0.130', 'AMMO3': '0.159', 'HITCOUNT': '0.180', 'WEAPON5': '0.200', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.014', 'weapon3': '1.388', 'weapon2': '1.810', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:54,272][63734] DAMAGECOUNT value on done: 3567.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:54,273][63734] Sum rewards: -5.465, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.410', 'weapon7': '0.006', 'AMMO2': '0.010', 'AMMO5': '0.013', 'weapon5': '0.016', 'AMMO4': '0.050', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.124', 'AMMO3': '0.175', 'WEAPON5': '0.200', 'HITCOUNT': '0.270', 'DAMAGECOUNT': '0.819', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.172', 'weapon3': '1.990'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:54,361][63805] DAMAGECOUNT value on done: 5433.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:54,361][63805] Sum rewards: -4.144, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.416', 'AMMO5': '0.003', 'weapon5': '0.008', 'AMMO2': '0.021', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.102', 'AMMO3': '0.133', 'HITCOUNT': '0.150', 'weapon4': '0.192', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.146', 'weapon3': '1.742'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:54,915][63769] DAMAGECOUNT value on done: 5503.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:54,915][63769] Sum rewards: -0.099, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.160', 'AMMO2': '0.010', 'AMMO5': '0.013', 'ARMOR': '0.032', 'AMMO4': '0.050', 'weapon5': '0.068', 'WEAPON4': '0.100', 'HITCOUNT': '0.160', 'AMMO3': '0.174', 'weapon4': '0.188', 'WEAPON5': '0.200', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.089', 'weapon3': '1.296', 'weapon2': '2.082', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:55,229][63769] DAMAGECOUNT value on done: 3178.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:55,229][63769] Sum rewards: 1.073, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.950', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'ARMOR': '0.012', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'weapon5': '0.124', 'AMMO3': '0.196', 'WEAPON5': '0.200', 'HITCOUNT': '0.280', 'WEAPON3': '0.950', 'weapon2': '1.102', 'DAMAGECOUNT': '1.149', 'weapon3': '2.258', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:55,568][63771] DAMAGECOUNT value on done: 5244.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:55,569][63771] Sum rewards: 0.717, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.036', 'AMMO4': '-0.032', 'AMMO2': '-0.006', 'AMMO5': '0.005', 'AMMO3': '0.091', 'ARMOR': '0.123', 'HITCOUNT': '0.180', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.768', 'weapon3': '1.748', 'FRAGCOUNT': '2.000', 'weapon2': '2.026'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:55,955][63771] DAMAGECOUNT value on done: 3572.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:55,955][63771] Sum rewards: -2.285, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.558', 'AMMO2': '0.011', 'ARMOR': '0.036', 'WEAPON4': '0.050', 'AMMO4': '0.056', 'AMMO3': '0.155', 'weapon4': '0.180', 'HITCOUNT': '0.220', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.930', 'weapon2': '1.288', 'weapon3': '1.596', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:57,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11127.5, 300 sec: 11149.5). Total num frames: 8949760. Throughput: 0: 1558.1, 1: 1211.6. Samples: 2234586. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:49:57,460][109198] Avg episode reward: [(0, '-2.441'), (1, '-4.832')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:57,746][63733] Updated weights for policy 1, policy_version 1100 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:58,239][63769] DAMAGECOUNT value on done: 3750.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:58,239][63769] Sum rewards: -5.332, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.410', 'ARMOR': '0.004', 'AMMO5': '0.015', 'AMMO2': '0.022', 'weapon5': '0.050', 'HITCOUNT': '0.080', 'AMMO4': '0.110', 'AMMO3': '0.126', 'weapon4': '0.136', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.321', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.266', 'weapon3': '1.998'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:58,693][63769] DAMAGECOUNT value on done: 5289.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:49:58,693][63769] Sum rewards: -0.987, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.122', 'AMMO2': '0.003', 'AMMO4': '0.014', 'AMMO3': '0.101', 'WEAPON4': '0.150', 'HITCOUNT': '0.210', 'weapon4': '0.232', 'ARMOR': '0.521', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.600', 'weapon2': '1.434', 'weapon3': '1.520', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:00,012][63732] Updated weights for policy 0, policy_version 1090 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:00,514][63770] DAMAGECOUNT value on done: 5920.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:00,515][63770] Sum rewards: -1.643, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.610', 'AMMO5': '0.015', 'AMMO2': '0.023', 'HITCOUNT': '0.080', 'AMMO4': '0.113', 'AMMO3': '0.130', 'weapon5': '0.158', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'weapon4': '0.416', 'ARMOR': '0.476', 'DAMAGECOUNT': '0.585', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.134', 'weapon3': '1.236'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:00,611][63771] DAMAGECOUNT value on done: 2915.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:00,611][63771] Sum rewards: 0.142, reward structure: {'DEATHCOUNT': '-5.250', 'weapon5': '0.010', 'AMMO2': '0.010', 'AMMO5': '0.012', 'ARMOR': '0.028', 'WEAPON4': '0.050', 'AMMO4': '0.051', 'AMMO3': '0.054', 'HITCOUNT': '0.120', 'WEAPON5': '0.150', 'weapon4': '0.164', 'HEALTH': '0.303', 'WEAPON3': '0.350', 'DAMAGECOUNT': '0.375', 'weapon3': '0.846', 'FRAGCOUNT': '1.000', 'weapon2': '1.868'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:00,909][63770] DAMAGECOUNT value on done: 3189.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:00,960][63771] DAMAGECOUNT value on done: 4832.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:01,809][63767] DAMAGECOUNT value on done: 5674.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:01,809][63767] Sum rewards: -6.411, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.580', 'FRAGCOUNT': '-1.500', 'AMMO2': '0.000', 'AMMO4': '0.001', 'AMMO5': '0.005', 'weapon5': '0.056', 'HITCOUNT': '0.060', 'weapon4': '0.080', 'AMMO3': '0.091', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.120', 'WEAPON4': '0.150', 'ARMOR': '0.596', 'WEAPON3': '0.600', 'weapon3': '1.354', 'weapon2': '1.706'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:02,199][63767] DAMAGECOUNT value on done: 5998.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:02,416][63767] DAMAGECOUNT value on done: 6512.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:02,416][63767] Sum rewards: -6.084, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.962', 'AMMO5': '0.007', 'AMMO2': '0.008', 'ARMOR': '0.028', 'AMMO4': '0.037', 'WEAPON4': '0.050', 'weapon5': '0.072', 'weapon4': '0.096', 'WEAPON5': '0.100', 'AMMO3': '0.147', 'HITCOUNT': '0.160', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.996', 'FRAGCOUNT': '1.000', 'weapon3': '1.654', 'weapon2': '1.722'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:02,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11059.2, 300 sec: 11149.5). Total num frames: 9003008. Throughput: 0: 1559.7, 1: 1214.0. Samples: 2243095. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:02,460][109198] Avg episode reward: [(0, '-2.478'), (1, '-4.705')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:02,811][63767] DAMAGECOUNT value on done: 5935.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:02,811][63767] Sum rewards: 2.530, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.120', 'AMMO4': '-0.068', 'AMMO2': '-0.013', 'AMMO5': '0.003', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'weapon5': '0.098', 'WEAPON5': '0.100', 'AMMO3': '0.125', 'HITCOUNT': '0.310', 'WEAPON3': '0.700', 'weapon2': '1.292', 'DAMAGECOUNT': '1.443', 'weapon3': '1.866', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:02,855][63806] Large shaping reward -2.549 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.3, -100.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:05,113][63735] DAMAGECOUNT value on done: 4858.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:05,114][63735] Sum rewards: -4.463, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.503', 'AMMO5': '0.003', 'AMMO2': '0.006', 'WEAPON1': '0.010', 'AMMO4': '0.029', 'ARMOR': '0.048', 'WEAPON5': '0.050', 'AMMO3': '0.093', 'WEAPON4': '0.100', 'weapon4': '0.134', 'HITCOUNT': '0.150', 'DAMAGECOUNT': '0.570', 'WEAPON3': '0.600', 'weapon3': '1.498', 'weapon2': '1.500', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:05,528][63735] DAMAGECOUNT value on done: 4690.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:05,528][63735] Sum rewards: -5.337, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.230', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.015', 'AMMO2': '-0.003', 'AMMO5': '0.005', 'ARMOR': '0.032', 'weapon5': '0.078', 'WEAPON4': '0.100', 'weapon7': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.130', 'AMMO3': '0.140', 'WEAPON5': '0.150', 'weapon4': '0.188', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.516', 'WEAPON3': '0.900', 'weapon2': '0.976', 'weapon3': '1.156'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:06,063][63733] Updated weights for policy 1, policy_version 1110 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:06,496][63732] Updated weights for policy 0, policy_version 1100 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:07,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11127.5, 300 sec: 11149.5). Total num frames: 9060352. Throughput: 0: 1561.2, 1: 1216.0. Samples: 2259876. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:07,460][109198] Avg episode reward: [(0, '-2.430'), (1, '-4.722')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:07,465][63454] Saving new best policy, reward=-2.430!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:08,683][63805] DAMAGECOUNT value on done: 6481.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:08,684][63805] Sum rewards: 2.327, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.410', 'AMMO2': '0.004', 'AMMO5': '0.007', 'AMMO4': '0.022', 'weapon5': '0.056', 'ARMOR': '0.092', 'WEAPON4': '0.100', 'AMMO3': '0.109', 'WEAPON5': '0.150', 'HITCOUNT': '0.240', 'weapon4': '0.326', 'WEAPON3': '0.550', 'weapon2': '0.856', 'DAMAGECOUNT': '1.386', 'weapon3': '1.588', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:09,014][63805] DAMAGECOUNT value on done: 4108.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:10,720][63735] DAMAGECOUNT value on done: 4896.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:10,720][63735] Sum rewards: -5.510, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.742', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.021', 'AMMO2': '-0.004', 'WEAPON1': '0.020', 'AMMO5': '0.025', 'ARMOR': '0.060', 'weapon5': '0.062', 'HITCOUNT': '0.170', 'AMMO3': '0.171', 'WEAPON5': '0.450', 'DAMAGECOUNT': '0.633', 'WEAPON3': '0.900', 'weapon3': '1.492', 'weapon2': '1.774'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:11,119][63735] DAMAGECOUNT value on done: 3113.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:11,120][63735] Sum rewards: -6.159, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.528', 'AMMO2': '0.001', 'AMMO4': '0.005', 'ARMOR': '0.036', 'HITCOUNT': '0.150', 'AMMO3': '0.182', 'DAMAGECOUNT': '0.405', 'WEAPON3': '1.100', 'weapon2': '1.260', 'FRAGCOUNT': '2.000', 'weapon3': '2.230'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:12,068][63770] DAMAGECOUNT value on done: 4239.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:12,145][63806] DAMAGECOUNT value on done: 4913.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:12,145][63806] Sum rewards: -3.971, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.884', 'ARMOR': '0.008', 'AMMO5': '0.012', 'AMMO2': '0.014', 'weapon5': '0.042', 'weapon4': '0.048', 'WEAPON4': '0.050', 'AMMO4': '0.071', 'AMMO3': '0.116', 'WEAPON5': '0.250', 'HITCOUNT': '0.310', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.140', 'FRAGCOUNT': '1.500', 'weapon2': '1.580', 'weapon3': '1.872'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:12,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11127.4, 300 sec: 11163.3). Total num frames: 9117696. Throughput: 0: 1556.7, 1: 1212.0. Samples: 2276435. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:12,460][109198] Avg episode reward: [(0, '-2.417'), (1, '-4.807')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:12,462][63454] Saving new best policy, reward=-2.417!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:12,468][63770] DAMAGECOUNT value on done: 4360.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:12,469][63770] Sum rewards: 0.334, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.904', 'AMMO4': '-0.037', 'AMMO2': '-0.007', 'AMMO5': '0.015', 'ARMOR': '0.057', 'weapon5': '0.110', 'AMMO3': '0.131', 'HITCOUNT': '0.190', 'WEAPON5': '0.250', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.203', 'weapon2': '1.698', 'weapon3': '1.778', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:12,543][63806] DAMAGECOUNT value on done: 4863.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:12,543][63806] Sum rewards: -5.032, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.446', 'AMMO5': '0.007', 'AMMO2': '0.011', 'weapon4': '0.044', 'weapon5': '0.048', 'WEAPON4': '0.050', 'AMMO4': '0.054', 'ARMOR': '0.064', 'WEAPON5': '0.150', 'AMMO3': '0.196', 'HITCOUNT': '0.360', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.434', 'FRAGCOUNT': '1.500', 'weapon2': '1.564', 'weapon3': '2.032'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:13,077][63732] Updated weights for policy 0, policy_version 1110 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:14,487][63733] Updated weights for policy 1, policy_version 1120 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:14,795][63806] DAMAGECOUNT value on done: 4266.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:14,796][63806] Sum rewards: -7.925, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.758', 'AMMO2': '0.002', 'AMMO4': '0.011', 'weapon7': '0.030', 'ARMOR': '0.040', 'weapon4': '0.042', 'WEAPON4': '0.050', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.147', 'HITCOUNT': '0.220', 'DAMAGECOUNT': '0.825', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.606', 'weapon3': '1.610'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:15,190][63806] DAMAGECOUNT value on done: 6081.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:15,191][63806] Sum rewards: -4.691, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.176', 'AMMO4': '-0.073', 'AMMO2': '-0.015', 'WEAPON1': '0.010', 'AMMO5': '0.017', 'ARMOR': '0.036', 'weapon5': '0.108', 'HITCOUNT': '0.170', 'AMMO3': '0.172', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.498', 'WEAPON3': '0.550', 'weapon3': '1.420', 'FRAGCOUNT': '2.000', 'weapon2': '2.092'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:16,144][63734] DAMAGECOUNT value on done: 4493.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:16,541][63734] DAMAGECOUNT value on done: 3746.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:16,541][63734] Sum rewards: -4.930, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-0.500', 'HEALTH': '-0.440', 'AMMO5': '0.009', 'AMMO2': '0.022', 'weapon5': '0.070', 'ARMOR': '0.072', 'AMMO4': '0.108', 'HITCOUNT': '0.150', 'AMMO3': '0.165', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.432', 'WEAPON3': '0.850', 'weapon2': '1.746', 'weapon3': '1.936'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:17,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11059.2, 300 sec: 11135.6). Total num frames: 9170944. Throughput: 0: 1559.3, 1: 1211.2. Samples: 2284805. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:17,460][109198] Avg episode reward: [(0, '-2.450'), (1, '-4.817')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:18,347][63769] DAMAGECOUNT value on done: 5766.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:18,347][63769] Sum rewards: -4.454, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.471', 'AMMO2': '0.009', 'AMMO5': '0.011', 'ARMOR': '0.028', 'AMMO4': '0.043', 'weapon5': '0.056', 'WEAPON4': '0.100', 'AMMO3': '0.137', 'WEAPON5': '0.150', 'weapon4': '0.172', 'HITCOUNT': '0.260', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.789', 'FRAGCOUNT': '1.000', 'weapon2': '1.574', 'weapon3': '1.688'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:18,689][63769] DAMAGECOUNT value on done: 3610.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:18,689][63769] Sum rewards: -3.923, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.398', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'AMMO5': '0.017', 'AMMO3': '0.173', 'weapon5': '0.192', 'HITCOUNT': '0.290', 'WEAPON5': '0.400', 'WEAPON3': '0.700', 'weapon3': '1.164', 'DAMAGECOUNT': '1.296', 'FRAGCOUNT': '1.500', 'weapon2': '2.274'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:18,754][63734] DAMAGECOUNT value on done: 5653.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:18,755][63734] Sum rewards: -4.154, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '0.000', 'weapon4': '0.028', 'AMMO2': '0.030', 'ARMOR': '0.048', 'weapon7': '0.086', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.110', 'AMMO4': '0.150', 'HITCOUNT': '0.150', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.456', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.452', 'weapon3': '1.736'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:19,097][63805] DAMAGECOUNT value on done: 5762.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:19,097][63805] Sum rewards: -0.005, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.875', 'AMMO4': '-0.052', 'AMMO2': '-0.010', 'ARMOR': '0.008', 'WEAPON4': '0.050', 'weapon7': '0.088', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.146', 'weapon4': '0.168', 'WEAPON7': '0.200', 'HITCOUNT': '0.300', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.344', 'weapon3': '1.474', 'weapon2': '1.564', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:19,145][63734] DAMAGECOUNT value on done: 4052.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:19,146][63734] Sum rewards: 4.076, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.275', 'AMMO4': '-0.000', 'AMMO2': '0.000', 'WEAPON1': '0.010', 'AMMO5': '0.017', 'ARMOR': '0.032', 'AMMO3': '0.111', 'weapon5': '0.200', 'HITCOUNT': '0.270', 'WEAPON5': '0.300', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.455', 'weapon2': '1.632', 'weapon3': '1.674', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:19,458][63805] DAMAGECOUNT value on done: 5488.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:19,637][63732] Updated weights for policy 0, policy_version 1120 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:20,456][63771] DAMAGECOUNT value on done: 5417.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:20,457][63771] Sum rewards: -3.530, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.025', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.009', 'WEAPON1': '0.030', 'ARMOR': '0.080', 'WEAPON4': '0.100', 'AMMO3': '0.124', 'HITCOUNT': '0.180', 'weapon5': '0.210', 'WEAPON5': '0.250', 'weapon4': '0.270', 'DAMAGECOUNT': '0.519', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.286', 'weapon3': '1.892'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:20,850][63771] DAMAGECOUNT value on done: 3792.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:20,851][63771] Sum rewards: -6.214, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.988', 'AMMO4': '-0.038', 'AMMO2': '-0.008', 'AMMO5': '0.013', 'ARMOR': '0.020', 'weapon4': '0.032', 'weapon5': '0.064', 'WEAPON4': '0.100', 'AMMO3': '0.101', 'WEAPON5': '0.150', 'HITCOUNT': '0.180', 'DAMAGECOUNT': '0.660', 'WEAPON3': '0.700', 'weapon3': '1.484', 'weapon2': '1.816', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:22,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11127.5, 300 sec: 11149.4). Total num frames: 9228288. Throughput: 0: 1557.2, 1: 1210.5. Samples: 2301438. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:22,460][109198] Avg episode reward: [(0, '-2.450'), (1, '-4.843')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:22,533][63806] Large shaping reward -2.504 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.255, -85.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:22,907][63733] Updated weights for policy 1, policy_version 1130 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:23,195][63769] DAMAGECOUNT value on done: 4105.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:23,195][63769] Sum rewards: -4.053, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.594', 'AMMO5': '0.005', 'AMMO2': '0.013', 'weapon5': '0.024', 'ARMOR': '0.064', 'AMMO4': '0.065', 'WEAPON5': '0.100', 'AMMO3': '0.132', 'HITCOUNT': '0.290', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.065', 'weapon2': '1.438', 'weapon3': '1.996'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:23,422][63771] DAMAGECOUNT value on done: 2999.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:23,591][63769] DAMAGECOUNT value on done: 5835.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:23,592][63769] Sum rewards: 1.567, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.270', 'AMMO2': '0.004', 'ARMOR': '0.005', 'AMMO4': '0.022', 'AMMO3': '0.122', 'HITCOUNT': '0.390', 'WEAPON3': '0.650', 'weapon2': '1.540', 'DAMAGECOUNT': '1.638', 'weapon3': '1.716', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:23,817][63771] DAMAGECOUNT value on done: 4932.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:23,817][63771] Sum rewards: -1.359, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.454', 'AMMO5': '0.003', 'AMMO2': '0.009', 'weapon5': '0.022', 'ARMOR': '0.044', 'AMMO4': '0.044', 'WEAPON5': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.077', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon2': '1.470', 'weapon3': '1.516'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:23,968][63767] DAMAGECOUNT value on done: 5931.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:23,968][63767] Sum rewards: -4.164, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.105', 'AMMO2': '0.007', 'weapon4': '0.010', 'AMMO4': '0.033', 'ARMOR': '0.040', 'WEAPON4': '0.100', 'AMMO3': '0.108', 'HITCOUNT': '0.170', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.771', 'FRAGCOUNT': '1.000', 'weapon3': '1.608', 'weapon2': '1.694'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:24,300][63767] DAMAGECOUNT value on done: 6138.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:24,301][63767] Sum rewards: -6.098, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.264', 'AMMO2': '0.006', 'AMMO5': '0.012', 'weapon5': '0.018', 'AMMO4': '0.030', 'WEAPON4': '0.050', 'weapon7': '0.050', 'ARMOR': '0.068', 'HITCOUNT': '0.110', 'weapon4': '0.140', 'AMMO3': '0.151', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON7': '0.200', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.338', 'weapon3': '1.702'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:25,303][63767] DAMAGECOUNT value on done: 6988.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:25,304][63767] Sum rewards: 0.873, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.484', 'AMMO4': '-0.041', 'AMMO2': '-0.008', 'AMMO5': '0.011', 'ARMOR': '0.060', 'AMMO3': '0.155', 'weapon5': '0.158', 'HITCOUNT': '0.290', 'WEAPON5': '0.300', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.428', 'weapon3': '1.754', 'weapon2': '1.800', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:25,662][63770] DAMAGECOUNT value on done: 6053.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:25,711][63767] DAMAGECOUNT value on done: 6497.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:25,712][63767] Sum rewards: 2.412, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.350', 'AMMO4': '-0.012', 'AMMO2': '-0.002', 'AMMO5': '0.007', 'ARMOR': '0.040', 'weapon7': '0.064', 'weapon5': '0.090', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.121', 'WEAPON5': '0.150', 'weapon4': '0.154', 'WEAPON7': '0.200', 'HITCOUNT': '0.310', 'WEAPON3': '0.750', 'weapon2': '1.500', 'weapon3': '1.614', 'DAMAGECOUNT': '1.686', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:26,007][63770] DAMAGECOUNT value on done: 3338.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:26,007][63770] Sum rewards: -3.488, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.118', 'AMMO4': '-0.004', 'AMMO2': '-0.001', 'WEAPON4': '0.050', 'HITCOUNT': '0.090', 'AMMO3': '0.101', 'DAMAGECOUNT': '0.447', 'ARMOR': '0.504', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.286', 'weapon2': '1.806'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:26,110][63732] Updated weights for policy 0, policy_version 1130 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:27,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11127.4, 300 sec: 11163.3). Total num frames: 9285632. Throughput: 0: 1564.0, 1: 1215.1. Samples: 2318279. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:27,460][109198] Avg episode reward: [(0, '-2.259'), (1, '-4.694')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:27,466][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001135_4648960.pth...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:27,467][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001132_4636672.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:27,521][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000799_3272704.pth\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:27,524][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000814_3334144.pth\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:27,529][63454] Saving new best policy, reward=-2.259!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:29,926][63735] DAMAGECOUNT value on done: 5108.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:29,927][63735] Sum rewards: -4.097, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.763', 'AMMO2': '0.021', 'weapon4': '0.054', 'ARMOR': '0.060', 'AMMO4': '0.103', 'AMMO3': '0.116', 'HITCOUNT': '0.150', 'WEAPON4': '0.200', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.750', 'weapon3': '1.516', 'weapon2': '1.596', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:30,334][63735] DAMAGECOUNT value on done: 5064.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:30,334][63735] Sum rewards: 1.088, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.361', 'AMMO4': '-0.028', 'AMMO2': '-0.005', 'AMMO5': '0.008', 'AMMO3': '0.056', 'ARMOR': '0.064', 'weapon5': '0.086', 'weapon7': '0.102', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON7': '0.200', 'WEAPON5': '0.200', 'HITCOUNT': '0.280', 'WEAPON3': '0.450', 'weapon3': '1.104', 'DAMAGECOUNT': '1.122', 'weapon2': '1.570', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:31,375][63733] Updated weights for policy 1, policy_version 1140 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:32,458][109198] Fps is (10 sec: 11059.4, 60 sec: 11059.2, 300 sec: 11149.5). Total num frames: 9338880. Throughput: 0: 1567.4, 1: 1216.1. Samples: 2326636. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:32,460][109198] Avg episode reward: [(0, '-2.208'), (1, '-4.703')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:32,461][63454] Saving new best policy, reward=-2.208!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:32,679][63732] Updated weights for policy 0, policy_version 1140 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:33,602][63805] DAMAGECOUNT value on done: 6681.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:33,603][63805] Sum rewards: -0.317, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.086', 'AMMO2': '0.016', 'AMMO5': '0.022', 'AMMO4': '0.082', 'AMMO3': '0.083', 'HITCOUNT': '0.130', 'WEAPON4': '0.150', 'weapon5': '0.184', 'WEAPON5': '0.350', 'weapon4': '0.402', 'ARMOR': '0.555', 'DAMAGECOUNT': '0.600', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.228', 'weapon3': '1.366'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:34,064][63805] DAMAGECOUNT value on done: 4203.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:34,065][63805] Sum rewards: -3.477, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.004', 'AMMO4': '-0.043', 'AMMO2': '-0.009', 'AMMO5': '0.007', 'weapon5': '0.026', 'ARMOR': '0.028', 'WEAPON5': '0.050', 'HITCOUNT': '0.100', 'AMMO3': '0.127', 'weapon6': '0.128', 'AMMO6': '0.172', 'AMMO7': '0.172', 'WEAPON6': '0.200', 'DAMAGECOUNT': '0.285', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.388', 'weapon2': '1.744'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:35,115][63806] DAMAGECOUNT value on done: 5375.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:35,115][63806] Sum rewards: 0.043, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.280', 'WEAPON1': '0.010', 'AMMO5': '0.018', 'AMMO2': '0.018', 'weapon5': '0.020', 'ARMOR': '0.080', 'AMMO4': '0.090', 'AMMO3': '0.123', 'WEAPON4': '0.150', 'weapon4': '0.214', 'WEAPON5': '0.250', 'HITCOUNT': '0.280', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.386', 'weapon3': '1.720', 'weapon2': '1.764'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:35,490][63735] DAMAGECOUNT value on done: 5333.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:35,491][63735] Sum rewards: -1.875, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.710', 'AMMO4': '-0.076', 'AMMO2': '-0.015', 'AMMO5': '0.007', 'weapon5': '0.074', 'AMMO3': '0.160', 'WEAPON5': '0.200', 'HITCOUNT': '0.330', 'ARMOR': '0.495', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.311', 'weapon2': '1.522', 'weapon3': '1.926', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:35,502][63806] DAMAGECOUNT value on done: 5186.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:35,502][63806] Sum rewards: -6.313, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-3.320', 'AMMO4': '-0.053', 'AMMO2': '-0.011', 'ARMOR': '0.014', 'AMMO5': '0.015', 'weapon5': '0.174', 'AMMO3': '0.196', 'HITCOUNT': '0.200', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.969', 'WEAPON3': '1.200', 'weapon2': '1.542', 'weapon3': '1.710', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:35,883][63735] DAMAGECOUNT value on done: 3132.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:35,884][63735] Sum rewards: -7.193, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.387', 'AMMO2': '0.021', 'HITCOUNT': '0.040', 'DAMAGECOUNT': '0.057', 'ARMOR': '0.064', 'AMMO4': '0.107', 'AMMO3': '0.125', 'WEAPON4': '0.300', 'weapon4': '0.310', 'WEAPON3': '0.550', 'weapon3': '0.892', 'FRAGCOUNT': '1.000', 'weapon2': '1.978'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:37,236][63770] DAMAGECOUNT value on done: 4579.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:37,236][63770] Sum rewards: 3.938, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.426', 'AMMO2': '0.002', 'AMMO5': '0.005', 'AMMO4': '0.011', 'weapon5': '0.050', 'ARMOR': '0.072', 'WEAPON5': '0.100', 'AMMO3': '0.115', 'HITCOUNT': '0.220', 'WEAPON4': '0.250', 'weapon4': '0.322', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.020', 'weapon2': '1.364', 'weapon3': '1.382', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:37,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11127.5, 300 sec: 11149.5). Total num frames: 9396224. Throughput: 0: 1565.4, 1: 1214.8. Samples: 2343142. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:37,460][109198] Avg episode reward: [(0, '-2.119'), (1, '-4.587')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:37,466][63454] Saving new best policy, reward=-2.119!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:37,622][63770] DAMAGECOUNT value on done: 4410.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:39,084][63806] DAMAGECOUNT value on done: 4369.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:39,084][63806] Sum rewards: -3.943, reward structure: {'DEATHCOUNT': '-6.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.790', 'AMMO4': '-0.033', 'AMMO2': '-0.006', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'weapon5': '0.072', 'AMMO3': '0.090', 'HITCOUNT': '0.090', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.309', 'WEAPON3': '0.650', 'weapon2': '1.462', 'weapon3': '1.546'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:39,300][63732] Updated weights for policy 0, policy_version 1150 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:39,492][63806] DAMAGECOUNT value on done: 6255.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:39,493][63806] Sum rewards: -1.247, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.892', 'AMMO5': '0.005', 'AMMO2': '0.009', 'weapon5': '0.030', 'AMMO4': '0.043', 'ARMOR': '0.084', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.140', 'AMMO3': '0.143', 'weapon4': '0.250', 'DAMAGECOUNT': '0.522', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.594', 'weapon3': '1.626'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:39,747][63733] Updated weights for policy 1, policy_version 1150 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:39,926][63734] DAMAGECOUNT value on done: 4658.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:40,261][63734] DAMAGECOUNT value on done: 4037.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:40,262][63734] Sum rewards: -1.096, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.518', 'AMMO2': '0.006', 'WEAPON1': '0.010', 'weapon5': '0.012', 'AMMO5': '0.012', 'AMMO4': '0.032', 'WEAPON4': '0.100', 'ARMOR': '0.116', 'WEAPON5': '0.150', 'AMMO3': '0.168', 'weapon4': '0.206', 'HITCOUNT': '0.270', 'DAMAGECOUNT': '0.873', 'WEAPON3': '1.000', 'weapon2': '1.584', 'weapon3': '1.882', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:41,850][63769] DAMAGECOUNT value on done: 5973.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:41,850][63769] Sum rewards: -4.961, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.640', 'AMMO2': '0.002', 'AMMO5': '0.010', 'AMMO4': '0.010', 'weapon7': '0.048', 'ARMOR': '0.056', 'weapon5': '0.084', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.150', 'AMMO3': '0.159', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.621', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.558', 'weapon2': '1.940'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:42,252][63769] DAMAGECOUNT value on done: 3835.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:42,253][63769] Sum rewards: -7.450, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.240', 'AMMO4': '-0.002', 'AMMO2': '-0.000', 'AMMO5': '0.005', 'ARMOR': '0.024', 'weapon5': '0.042', 'WEAPON5': '0.050', 'HITCOUNT': '0.190', 'AMMO3': '0.210', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon3': '1.466', 'weapon2': '2.230'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:42,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11059.2, 300 sec: 11135.6). Total num frames: 9449472. Throughput: 0: 1563.6, 1: 1214.8. Samples: 2359611. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:42,460][109198] Avg episode reward: [(0, '-2.335'), (1, '-4.579')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:44,079][63734] DAMAGECOUNT value on done: 6048.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:44,080][63734] Sum rewards: -4.698, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.678', 'AMMO2': '0.008', 'AMMO4': '0.041', 'ARMOR': '0.088', 'WEAPON4': '0.150', 'AMMO3': '0.172', 'HITCOUNT': '0.280', 'weapon4': '0.304', 'WEAPON3': '1.100', 'weapon2': '1.126', 'DAMAGECOUNT': '1.185', 'weapon3': '1.776', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:44,092][63805] DAMAGECOUNT value on done: 6316.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:44,093][63805] Sum rewards: 4.692, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.465', 'AMMO2': '0.005', 'AMMO5': '0.017', 'AMMO4': '0.026', 'ARMOR': '0.060', 'weapon4': '0.068', 'weapon7': '0.070', 'AMMO3': '0.096', 'WEAPON4': '0.100', 'weapon5': '0.112', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.320', 'WEAPON3': '0.550', 'weapon2': '1.544', 'weapon3': '1.636', 'DAMAGECOUNT': '1.662', 'FRAGCOUNT': '6.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:44,449][63734] DAMAGECOUNT value on done: 4706.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:44,450][63734] Sum rewards: 0.500, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.890', 'AMMO4': '-0.039', 'AMMO2': '-0.008', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'AMMO3': '0.149', 'WEAPON5': '0.200', 'weapon5': '0.208', 'HITCOUNT': '0.390', 'WEAPON3': '0.700', 'weapon2': '1.220', 'DAMAGECOUNT': '1.941', 'weapon3': '2.060', 'FRAGCOUNT': '3.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:44,472][63805] DAMAGECOUNT value on done: 5643.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:45,456][63771] DAMAGECOUNT value on done: 5692.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:45,457][63771] Sum rewards: 3.454, reward structure: {'DEATHCOUNT': '-5.250', 'AMMO5': '0.010', 'AMMO2': '0.019', 'WEAPON1': '0.020', 'weapon7': '0.046', 'AMMO4': '0.094', 'weapon5': '0.098', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.106', 'WEAPON4': '0.150', 'HEALTH': '0.152', 'WEAPON5': '0.200', 'HITCOUNT': '0.240', 'weapon4': '0.502', 'ARMOR': '0.504', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.825', 'weapon2': '1.196', 'weapon3': '1.692', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:45,866][63771] DAMAGECOUNT value on done: 3807.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:46,023][63732] Updated weights for policy 0, policy_version 1160 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:46,204][63771] DAMAGECOUNT value on done: 3263.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:46,204][63771] Sum rewards: -0.519, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.582', 'AMMO2': '0.016', 'ARMOR': '0.056', 'AMMO4': '0.081', 'AMMO3': '0.141', 'WEAPON4': '0.200', 'HITCOUNT': '0.240', 'weapon4': '0.242', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.792', 'weapon3': '1.408', 'weapon2': '1.636', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:46,349][63767] DAMAGECOUNT value on done: 6172.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:46,350][63767] Sum rewards: -3.571, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.057', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'weapon5': '0.034', 'ARMOR': '0.064', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.132', 'AMMO3': '0.133', 'HITCOUNT': '0.230', 'DAMAGECOUNT': '0.723', 'WEAPON3': '0.900', 'weapon2': '1.248', 'weapon3': '1.810', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:46,588][63771] DAMAGECOUNT value on done: 5147.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:46,589][63771] Sum rewards: -4.515, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.130', 'AMMO2': '0.002', 'AMMO5': '0.003', 'AMMO4': '0.011', 'weapon5': '0.026', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'AMMO3': '0.180', 'HITCOUNT': '0.180', 'DAMAGECOUNT': '0.645', 'WEAPON3': '0.800', 'weapon3': '1.112', 'FRAGCOUNT': '2.000', 'weapon2': '2.066'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:46,739][63767] DAMAGECOUNT value on done: 6213.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:47,458][109198] Fps is (10 sec: 10649.6, 60 sec: 11127.5, 300 sec: 11135.6). Total num frames: 9502720. Throughput: 0: 1561.1, 1: 1212.8. Samples: 2367918. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:47,460][109198] Avg episode reward: [(0, '-2.164'), (1, '-4.397')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:48,384][63733] Updated weights for policy 1, policy_version 1160 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:48,443][63769] DAMAGECOUNT value on done: 4265.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:48,675][63767] DAMAGECOUNT value on done: 7293.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:48,676][63767] Sum rewards: 1.155, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.044', 'AMMO2': '0.010', 'AMMO5': '0.012', 'ARMOR': '0.026', 'AMMO4': '0.048', 'weapon5': '0.070', 'WEAPON4': '0.100', 'weapon4': '0.100', 'AMMO3': '0.146', 'WEAPON5': '0.250', 'HITCOUNT': '0.260', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.915', 'weapon3': '1.562', 'weapon2': '1.850', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:48,842][63769] DAMAGECOUNT value on done: 6055.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:48,843][63769] Sum rewards: -0.719, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.064', 'AMMO4': '-0.046', 'AMMO2': '-0.009', 'ARMOR': '0.008', 'AMMO3': '0.096', 'HITCOUNT': '0.140', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.660', 'FRAGCOUNT': '1.000', 'weapon3': '1.528', 'weapon2': '1.568'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:49,022][63767] DAMAGECOUNT value on done: 6907.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:49,022][63767] Sum rewards: -1.736, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.995', 'AMMO5': '0.012', 'AMMO2': '0.013', 'WEAPON1': '0.020', 'weapon4': '0.042', 'AMMO4': '0.067', 'WEAPON4': '0.100', 'weapon5': '0.130', 'AMMO3': '0.192', 'HITCOUNT': '0.230', 'WEAPON5': '0.250', 'ARMOR': '0.432', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.230', 'weapon2': '1.536', 'weapon3': '1.954', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:51,292][63770] DAMAGECOUNT value on done: 6291.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:51,292][63770] Sum rewards: -4.350, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.940', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.018', 'AMMO5': '0.019', 'WEAPON1': '0.030', 'AMMO4': '0.089', 'AMMO3': '0.138', 'weapon5': '0.184', 'HITCOUNT': '0.190', 'WEAPON5': '0.300', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.714', 'weapon2': '1.484', 'weapon3': '1.524'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:51,696][63770] DAMAGECOUNT value on done: 3533.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:51,696][63770] Sum rewards: -5.572, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.203', 'AMMO4': '-0.016', 'AMMO2': '-0.003', 'AMMO5': '0.003', 'weapon4': '0.012', 'WEAPON4': '0.050', 'ARMOR': '0.060', 'AMMO3': '0.163', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.585', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.592', 'weapon3': '1.766'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:52,458][109198] Fps is (10 sec: 10649.5, 60 sec: 11059.2, 300 sec: 11135.6). Total num frames: 9555968. Throughput: 0: 1549.1, 1: 1203.3. Samples: 2383737. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:52,460][109198] Avg episode reward: [(0, '-2.140'), (1, '-4.354')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:52,462][63576] Saving new best policy, reward=-4.354!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:52,835][63732] Updated weights for policy 0, policy_version 1170 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:55,246][63735] DAMAGECOUNT value on done: 5423.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:55,246][63735] Sum rewards: -2.931, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.240', 'AMMO2': '0.009', 'ARMOR': '0.044', 'AMMO4': '0.046', 'AMMO3': '0.120', 'weapon4': '0.164', 'WEAPON4': '0.200', 'HITCOUNT': '0.270', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.945', 'FRAGCOUNT': '1.000', 'weapon2': '1.492', 'weapon3': '1.668'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:55,688][63735] DAMAGECOUNT value on done: 5436.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:55,689][63735] Sum rewards: -2.599, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.558', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.010', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'ARMOR': '0.040', 'AMMO4': '0.049', 'AMMO3': '0.123', 'HITCOUNT': '0.230', 'WEAPON5': '0.300', 'weapon5': '0.324', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.116', 'weapon3': '1.434', 'weapon2': '1.600'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:57,261][63733] Updated weights for policy 1, policy_version 1170 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:57,458][109198] Fps is (10 sec: 10649.6, 60 sec: 10990.9, 300 sec: 11121.7). Total num frames: 9609216. Throughput: 0: 1540.8, 1: 1199.0. Samples: 2399728. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:50:57,460][109198] Avg episode reward: [(0, '-2.138'), (1, '-4.400')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:58,978][63806] DAMAGECOUNT value on done: 5402.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:59,083][63805] DAMAGECOUNT value on done: 6971.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:59,084][63805] Sum rewards: -1.655, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.704', 'AMMO2': '0.007', 'AMMO5': '0.013', 'AMMO4': '0.033', 'weapon7': '0.064', 'ARMOR': '0.088', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.100', 'weapon5': '0.102', 'AMMO3': '0.136', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON7': '0.200', 'HITCOUNT': '0.290', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.870', 'FRAGCOUNT': '1.000', 'weapon2': '1.252', 'weapon3': '1.874'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:59,319][63806] DAMAGECOUNT value on done: 5288.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:59,320][63806] Sum rewards: -0.461, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.762', 'AMMO2': '0.005', 'AMMO5': '0.005', 'weapon5': '0.016', 'AMMO4': '0.024', 'WEAPON1': '0.030', 'WEAPON5': '0.100', 'AMMO3': '0.117', 'HITCOUNT': '0.140', 'DAMAGECOUNT': '0.306', 'ARMOR': '0.564', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.098', 'weapon3': '1.496'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:59,436][63805] DAMAGECOUNT value on done: 4338.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:59,437][63805] Sum rewards: -5.589, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.110', 'AMMO2': '0.003', 'AMMO4': '0.014', 'ARMOR': '0.028', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.138', 'AMMO3': '0.159', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.900', 'weapon2': '1.306', 'weapon3': '1.618', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:50:59,596][63732] Updated weights for policy 0, policy_version 1180 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:00,702][63735] DAMAGECOUNT value on done: 5398.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:01,105][63735] DAMAGECOUNT value on done: 3475.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:01,106][63735] Sum rewards: -1.493, reward structure: {'DEATHCOUNT': '-9.750', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'ARMOR': '0.028', 'weapon5': '0.032', 'weapon4': '0.036', 'WEAPON4': '0.050', 'HEALTH': '0.070', 'AMMO4': '0.086', 'WEAPON5': '0.100', 'AMMO3': '0.122', 'HITCOUNT': '0.250', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.029', 'weapon3': '1.544', 'weapon2': '1.728', 'FRAGCOUNT': '2.500'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:02,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11059.2, 300 sec: 11135.6). Total num frames: 9666560. Throughput: 0: 1540.3, 1: 1200.4. Samples: 2408137. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:02,460][109198] Avg episode reward: [(0, '-2.122'), (1, '-4.366')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:03,070][63770] DAMAGECOUNT value on done: 4704.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:03,472][63770] DAMAGECOUNT value on done: 4455.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:03,473][63770] Sum rewards: -9.683, reward structure: {'DEATHCOUNT': '-11.250', 'FRAGCOUNT': '-3.000', 'HEALTH': '-0.188', 'weapon4': '0.002', 'WEAPON1': '0.010', 'AMMO2': '0.013', 'AMMO5': '0.014', 'ARMOR': '0.028', 'HITCOUNT': '0.050', 'AMMO4': '0.062', 'weapon5': '0.096', 'WEAPON4': '0.100', 'AMMO3': '0.119', 'DAMAGECOUNT': '0.135', 'WEAPON5': '0.200', 'WEAPON3': '0.700', 'weapon3': '1.446', 'weapon2': '1.780'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:04,418][63734] DAMAGECOUNT value on done: 4851.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:04,419][63734] Sum rewards: -6.789, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.880', 'AMMO2': '0.002', 'AMMO4': '0.011', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'WEAPON4': '0.100', 'AMMO3': '0.132', 'weapon4': '0.134', 'weapon5': '0.154', 'HITCOUNT': '0.200', 'WEAPON5': '0.250', 'ARMOR': '0.490', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.579', 'WEAPON3': '0.600', 'weapon2': '1.404', 'weapon3': '1.752'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:04,433][63806] DAMAGECOUNT value on done: 4569.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:04,434][63806] Sum rewards: -6.874, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.506', 'AMMO5': '0.005', 'AMMO2': '0.008', 'ARMOR': '0.010', 'weapon5': '0.016', 'AMMO4': '0.042', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'weapon4': '0.138', 'HITCOUNT': '0.150', 'AMMO3': '0.159', 'DAMAGECOUNT': '0.600', 'WEAPON3': '1.000', 'weapon2': '1.602', 'weapon3': '1.752', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:04,769][63734] DAMAGECOUNT value on done: 4194.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:04,769][63734] Sum rewards: -7.217, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.452', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.005', 'AMMO5': '0.013', 'AMMO4': '0.025', 'WEAPON1': '0.040', 'WEAPON4': '0.050', 'weapon4': '0.118', 'HITCOUNT': '0.150', 'AMMO3': '0.180', 'weapon5': '0.198', 'WEAPON5': '0.300', 'ARMOR': '0.466', 'DAMAGECOUNT': '0.471', 'WEAPON3': '0.800', 'weapon3': '1.572', 'weapon2': '1.596'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:04,852][63806] DAMAGECOUNT value on done: 6520.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:04,853][63806] Sum rewards: -3.402, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.786', 'AMMO5': '0.007', 'AMMO2': '0.019', 'WEAPON1': '0.020', 'ARMOR': '0.044', 'WEAPON4': '0.050', 'HITCOUNT': '0.060', 'AMMO4': '0.097', 'WEAPON5': '0.150', 'AMMO3': '0.156', 'weapon4': '0.162', 'weapon5': '0.272', 'DAMAGECOUNT': '0.795', 'WEAPON3': '0.800', 'weapon2': '1.312', 'FRAGCOUNT': '1.500', 'weapon3': '1.690'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:05,672][63733] Updated weights for policy 1, policy_version 1180 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:06,148][63732] Updated weights for policy 0, policy_version 1190 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:06,152][63769] DAMAGECOUNT value on done: 6293.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:06,152][63769] Sum rewards: 0.424, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.450', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.020', 'ARMOR': '0.032', 'weapon5': '0.044', 'WEAPON4': '0.050', 'weapon7': '0.080', 'AMMO6': '0.100', 'AMMO7': '0.100', 'HITCOUNT': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.140', 'weapon4': '0.198', 'WEAPON5': '0.400', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.960', 'weapon2': '1.322', 'weapon3': '1.824', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:06,492][63769] DAMAGECOUNT value on done: 4266.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:06,493][63769] Sum rewards: 0.015, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.463', 'AMMO4': '-0.006', 'AMMO2': '-0.001', 'WEAPON4': '0.050', 'ARMOR': '0.076', 'weapon4': '0.106', 'AMMO3': '0.142', 'HITCOUNT': '0.300', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.293', 'weapon2': '1.528', 'weapon3': '1.690', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:07,458][109198] Fps is (10 sec: 11059.3, 60 sec: 10990.9, 300 sec: 11121.7). Total num frames: 9719808. Throughput: 0: 1540.7, 1: 1200.0. Samples: 2424771. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:07,460][109198] Avg episode reward: [(0, '-2.200'), (1, '-4.470')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:08,962][63767] DAMAGECOUNT value on done: 6465.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:08,963][63767] Sum rewards: -1.232, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.330', 'AMMO4': '-0.040', 'AMMO2': '-0.008', 'AMMO5': '0.012', 'weapon5': '0.052', 'AMMO3': '0.099', 'WEAPON5': '0.150', 'HITCOUNT': '0.220', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.879', 'weapon3': '1.138', 'weapon2': '1.796', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:09,346][63767] DAMAGECOUNT value on done: 6228.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:09,521][63805] DAMAGECOUNT value on done: 6500.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:09,522][63805] Sum rewards: 0.257, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.038', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO2': '0.015', 'weapon7': '0.070', 'AMMO4': '0.073', 'weapon5': '0.076', 'AMMO3': '0.106', 'HITCOUNT': '0.140', 'WEAPON4': '0.250', 'WEAPON5': '0.250', 'AMMO6': '0.320', 'AMMO7': '0.320', 'weapon4': '0.340', 'WEAPON7': '0.400', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.552', 'FRAGCOUNT': '1.000', 'weapon3': '1.272', 'weapon2': '1.588'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:09,687][63771] DAMAGECOUNT value on done: 3413.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:09,687][63771] Sum rewards: -5.030, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.038', 'AMMO2': '0.016', 'ARMOR': '0.028', 'AMMO4': '0.079', 'AMMO3': '0.131', 'HITCOUNT': '0.140', 'WEAPON4': '0.300', 'weapon4': '0.328', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.850', 'weapon3': '1.396', 'weapon2': '1.790', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:09,875][63805] DAMAGECOUNT value on done: 5861.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:09,876][63805] Sum rewards: -2.412, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.946', 'AMMO5': '0.005', 'weapon5': '0.010', 'AMMO2': '0.016', 'WEAPON5': '0.050', 'AMMO4': '0.081', 'AMMO3': '0.084', 'WEAPON4': '0.100', 'HITCOUNT': '0.200', 'weapon4': '0.308', 'ARMOR': '0.448', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.654', 'weapon3': '1.288', 'weapon2': '1.540', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:10,071][63771] DAMAGECOUNT value on done: 5401.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:10,071][63771] Sum rewards: -3.258, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.025', 'AMMO4': '-0.051', 'AMMO2': '-0.010', 'weapon4': '0.042', 'ARMOR': '0.072', 'AMMO3': '0.096', 'WEAPON4': '0.100', 'HITCOUNT': '0.260', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.762', 'weapon3': '1.296', 'weapon2': '1.850', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:10,148][63734] DAMAGECOUNT value on done: 6348.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:10,149][63734] Sum rewards: -0.885, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.848', 'AMMO2': '0.001', 'AMMO5': '0.003', 'AMMO4': '0.003', 'weapon5': '0.040', 'WEAPON5': '0.050', 'AMMO3': '0.088', 'HITCOUNT': '0.240', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.900', 'weapon3': '1.154', 'weapon2': '1.734', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:10,475][63734] DAMAGECOUNT value on done: 4832.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:10,475][63734] Sum rewards: -8.858, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-3.000', 'HEALTH': '-1.488', 'AMMO4': '-0.020', 'AMMO2': '-0.004', 'AMMO5': '0.017', 'ARMOR': '0.060', 'HITCOUNT': '0.130', 'weapon5': '0.166', 'AMMO3': '0.176', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.378', 'WEAPON3': '1.050', 'weapon2': '1.468', 'weapon3': '1.708'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:11,288][63771] DAMAGECOUNT value on done: 6233.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:11,288][63771] Sum rewards: -1.610, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.598', 'AMMO4': '-0.029', 'AMMO2': '-0.006', 'AMMO5': '0.009', 'WEAPON1': '0.030', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon7': '0.100', 'AMMO3': '0.127', 'weapon5': '0.176', 'WEAPON5': '0.200', 'HITCOUNT': '0.360', 'WEAPON3': '0.800', 'weapon2': '1.320', 'DAMAGECOUNT': '1.623', 'weapon3': '1.728', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:11,753][63771] DAMAGECOUNT value on done: 4342.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:11,753][63771] Sum rewards: -1.453, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.654', 'AMMO5': '0.005', 'AMMO2': '0.009', 'WEAPON1': '0.020', 'AMMO4': '0.045', 'WEAPON5': '0.050', 'AMMO3': '0.127', 'HITCOUNT': '0.380', 'WEAPON3': '0.750', 'weapon3': '1.446', 'weapon2': '1.514', 'DAMAGECOUNT': '1.605', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:11,995][63767] DAMAGECOUNT value on done: 7426.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:11,995][63767] Sum rewards: -4.387, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.690', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.007', 'weapon5': '0.008', 'AMMO2': '0.011', 'AMMO4': '0.054', 'AMMO3': '0.110', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'weapon4': '0.340', 'DAMAGECOUNT': '0.399', 'WEAPON3': '0.650', 'weapon3': '1.200', 'weapon2': '1.834'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:12,388][63767] DAMAGECOUNT value on done: 7120.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:12,388][63767] Sum rewards: -4.365, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.280', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'AMMO5': '0.017', 'ARMOR': '0.040', 'WEAPON1': '0.040', 'weapon5': '0.080', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON4': '0.100', 'weapon7': '0.128', 'AMMO3': '0.157', 'HITCOUNT': '0.160', 'weapon4': '0.326', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.639', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon3': '1.124', 'weapon2': '1.564'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:12,458][109198] Fps is (10 sec: 10649.5, 60 sec: 10922.7, 300 sec: 11107.8). Total num frames: 9773056. Throughput: 0: 1533.9, 1: 1195.5. Samples: 2441103. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:12,460][109198] Avg episode reward: [(0, '-2.291'), (1, '-4.307')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:12,462][63576] Saving new best policy, reward=-4.307!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:12,806][63732] Updated weights for policy 0, policy_version 1200 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:14,298][63769] DAMAGECOUNT value on done: 4369.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:14,298][63769] Sum rewards: -2.275, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.842', 'AMMO5': '0.007', 'weapon7': '0.012', 'AMMO2': '0.016', 'WEAPON1': '0.030', 'weapon5': '0.076', 'AMMO4': '0.078', 'ARMOR': '0.080', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.145', 'WEAPON5': '0.150', 'weapon4': '0.178', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'DAMAGECOUNT': '0.312', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.260', 'weapon2': '1.962'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:14,305][63733] Updated weights for policy 1, policy_version 1190 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:14,636][63769] DAMAGECOUNT value on done: 6170.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:14,636][63769] Sum rewards: -5.294, reward structure: {'DEATHCOUNT': '-11.250', 'AMMO2': '0.008', 'AMMO4': '0.041', 'WEAPON4': '0.050', 'HITCOUNT': '0.080', 'HEALTH': '0.138', 'AMMO3': '0.158', 'DAMAGECOUNT': '0.345', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.624', 'weapon2': '1.762'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:17,059][63770] DAMAGECOUNT value on done: 6541.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:17,060][63770] Sum rewards: -2.261, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.729', 'AMMO5': '0.013', 'AMMO2': '0.015', 'ARMOR': '0.028', 'weapon5': '0.038', 'AMMO4': '0.074', 'weapon7': '0.092', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.105', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.380', 'weapon2': '1.954'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:17,458][109198] Fps is (10 sec: 11058.9, 60 sec: 10990.9, 300 sec: 11121.7). Total num frames: 9830400. Throughput: 0: 1528.9, 1: 1191.5. Samples: 2449055. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:17,461][109198] Avg episode reward: [(0, '-2.251'), (1, '-4.362')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:17,464][63770] DAMAGECOUNT value on done: 3838.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:17,465][63770] Sum rewards: -2.496, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.030', 'weapon5': '0.004', 'ARMOR': '0.004', 'AMMO2': '0.004', 'AMMO5': '0.013', 'AMMO4': '0.022', 'weapon4': '0.082', 'WEAPON4': '0.100', 'AMMO3': '0.116', 'WEAPON5': '0.250', 'HITCOUNT': '0.260', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.915', 'weapon2': '1.336', 'weapon3': '1.778', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:19,569][63732] Updated weights for policy 0, policy_version 1210 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:20,250][63735] DAMAGECOUNT value on done: 5528.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:20,251][63735] Sum rewards: -4.315, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.753', 'AMMO2': '0.007', 'AMMO4': '0.035', 'WEAPON4': '0.050', 'weapon4': '0.060', 'HITCOUNT': '0.080', 'AMMO3': '0.161', 'DAMAGECOUNT': '0.315', 'ARMOR': '0.472', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.288', 'weapon3': '2.020'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:20,565][63735] DAMAGECOUNT value on done: 5573.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:20,565][63735] Sum rewards: -3.093, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.706', 'AMMO2': '0.005', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.026', 'WEAPON4': '0.050', 'weapon5': '0.054', 'AMMO3': '0.121', 'HITCOUNT': '0.160', 'weapon4': '0.160', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.411', 'WEAPON3': '0.600', 'ARMOR': '0.851', 'weapon2': '1.416', 'weapon3': '1.774'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:22,236][63806] DAMAGECOUNT value on done: 5586.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:22,237][63806] Sum rewards: -7.161, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.528', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO2': '0.023', 'weapon5': '0.034', 'AMMO4': '0.112', 'weapon4': '0.126', 'HITCOUNT': '0.170', 'AMMO3': '0.182', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'ARMOR': '0.412', 'DAMAGECOUNT': '0.552', 'WEAPON3': '1.000', 'weapon2': '1.290', 'weapon3': '1.734'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:22,458][109198] Fps is (10 sec: 11059.3, 60 sec: 10922.7, 300 sec: 11121.7). Total num frames: 9883648. Throughput: 0: 1532.3, 1: 1192.5. Samples: 2465758. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:22,460][109198] Avg episode reward: [(0, '-2.258'), (1, '-4.299')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:22,462][63576] Saving new best policy, reward=-4.299!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:22,558][63806] DAMAGECOUNT value on done: 5456.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:22,558][63806] Sum rewards: -1.461, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.410', 'AMMO5': '0.012', 'AMMO2': '0.014', 'WEAPON4': '0.050', 'ARMOR': '0.064', 'AMMO4': '0.069', 'AMMO3': '0.121', 'HITCOUNT': '0.170', 'weapon4': '0.186', 'weapon5': '0.224', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.504', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.264', 'weapon3': '1.820'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:22,777][63733] Updated weights for policy 1, policy_version 1200 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:24,141][63805] DAMAGECOUNT value on done: 7265.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:24,141][63805] Sum rewards: -2.931, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.008', 'AMMO5': '0.012', 'HEALTH': '0.018', 'ARMOR': '0.028', 'AMMO4': '0.038', 'weapon5': '0.108', 'AMMO3': '0.142', 'WEAPON5': '0.150', 'HITCOUNT': '0.250', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.882', 'weapon2': '1.346', 'weapon3': '2.136'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:24,546][63805] DAMAGECOUNT value on done: 4387.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:25,692][63735] DAMAGECOUNT value on done: 5912.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:25,692][63735] Sum rewards: -4.367, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-3.060', 'AMMO2': '0.002', 'AMMO4': '0.010', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'AMMO3': '0.135', 'weapon4': '0.180', 'HITCOUNT': '0.200', 'weapon5': '0.238', 'WEAPON5': '0.300', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.113', 'weapon2': '1.258', 'FRAGCOUNT': '1.500', 'weapon3': '1.768'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:26,031][63732] Updated weights for policy 0, policy_version 1220 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:26,091][63735] DAMAGECOUNT value on done: 3641.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:26,091][63735] Sum rewards: -1.231, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.110', 'AMMO4': '-0.072', 'AMMO2': '-0.014', 'AMMO5': '0.012', 'weapon5': '0.060', 'AMMO3': '0.092', 'HITCOUNT': '0.100', 'WEAPON5': '0.150', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.498', 'weapon3': '1.098', 'weapon2': '1.504', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:27,458][109198] Fps is (10 sec: 11059.4, 60 sec: 10922.7, 300 sec: 11121.7). Total num frames: 9940992. Throughput: 0: 1533.6, 1: 1194.7. Samples: 2482383. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:27,460][109198] Avg episode reward: [(0, '-2.307'), (1, '-4.296')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:27,468][63576] Saving new best policy, reward=-4.296!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:28,209][63734] DAMAGECOUNT value on done: 5131.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:28,210][63734] Sum rewards: -4.008, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.270', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'weapon5': '0.026', 'ARMOR': '0.028', 'WEAPON4': '0.050', 'AMMO4': '0.083', 'WEAPON5': '0.100', 'AMMO3': '0.109', 'weapon4': '0.194', 'HITCOUNT': '0.270', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.840', 'weapon2': '1.356', 'weapon3': '1.822'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:28,571][63734] DAMAGECOUNT value on done: 4414.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:28,572][63734] Sum rewards: -4.895, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.712', 'AMMO2': '0.019', 'WEAPON1': '0.020', 'AMMO4': '0.092', 'AMMO3': '0.154', 'HITCOUNT': '0.200', 'WEAPON4': '0.300', 'ARMOR': '0.480', 'weapon4': '0.654', 'DAMAGECOUNT': '0.660', 'WEAPON3': '0.850', 'weapon2': '1.408', 'weapon3': '1.480', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:28,766][63770] DAMAGECOUNT value on done: 4808.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:29,110][63770] DAMAGECOUNT value on done: 4814.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:29,110][63770] Sum rewards: -1.928, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.320', 'AMMO5': '0.016', 'AMMO2': '0.017', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'AMMO4': '0.087', 'weapon4': '0.088', 'AMMO3': '0.157', 'HITCOUNT': '0.180', 'weapon5': '0.282', 'WEAPON5': '0.300', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.077', 'weapon3': '1.290', 'weapon2': '1.778', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:29,237][63806] DAMAGECOUNT value on done: 4598.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:29,679][63806] DAMAGECOUNT value on done: 6774.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:29,679][63806] Sum rewards: -1.113, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.345', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.003', 'ARMOR': '0.068', 'weapon7': '0.074', 'AMMO3': '0.077', 'weapon5': '0.090', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.110', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.160', 'WEAPON7': '0.200', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.762', 'FRAGCOUNT': '1.000', 'weapon3': '1.036', 'weapon2': '1.658'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:30,149][63769] DAMAGECOUNT value on done: 6398.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:30,149][63769] Sum rewards: -10.214, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.666', 'FRAGCOUNT': '-1.500', 'AMMO2': '0.009', 'weapon4': '0.014', 'AMMO5': '0.023', 'ARMOR': '0.028', 'AMMO4': '0.044', 'WEAPON4': '0.100', 'weapon5': '0.134', 'HITCOUNT': '0.140', 'AMMO3': '0.223', 'DAMAGECOUNT': '0.315', 'WEAPON5': '0.350', 'WEAPON3': '1.150', 'weapon2': '1.266', 'weapon3': '2.156'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:30,513][63769] DAMAGECOUNT value on done: 4374.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:30,513][63769] Sum rewards: -3.977, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-1.500', 'AMMO2': '0.007', 'WEAPON1': '0.010', 'ARMOR': '0.016', 'AMMO5': '0.016', 'AMMO4': '0.035', 'WEAPON4': '0.050', 'weapon5': '0.076', 'AMMO3': '0.110', 'HITCOUNT': '0.120', 'weapon4': '0.148', 'HEALTH': '0.174', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.324', 'WEAPON3': '0.450', 'weapon2': '1.438', 'weapon3': '1.798'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:31,225][63733] Updated weights for policy 1, policy_version 1210 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:31,593][63767] DAMAGECOUNT value on done: 6590.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:31,594][63767] Sum rewards: -2.416, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.695', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.001', 'AMMO5': '0.003', 'AMMO4': '0.005', 'WEAPON1': '0.030', 'WEAPON5': '0.050', 'weapon5': '0.060', 'AMMO3': '0.110', 'HITCOUNT': '0.140', 'DAMAGECOUNT': '0.375', 'ARMOR': '0.447', 'WEAPON3': '0.500', 'weapon2': '1.498', 'weapon3': '1.560'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:31,943][63767] DAMAGECOUNT value on done: 6403.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:31,944][63767] Sum rewards: -5.558, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.955', 'AMMO2': '0.003', 'AMMO5': '0.008', 'WEAPON1': '0.010', 'AMMO4': '0.013', 'weapon5': '0.016', 'ARMOR': '0.020', 'AMMO3': '0.096', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.160', 'weapon4': '0.206', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.525', 'weapon3': '1.378', 'weapon2': '1.512'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:32,458][109198] Fps is (10 sec: 11059.0, 60 sec: 10922.6, 300 sec: 11121.7). Total num frames: 9994240. Throughput: 0: 1532.0, 1: 1193.2. Samples: 2490551. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:32,460][109198] Avg episode reward: [(0, '-2.491'), (1, '-4.221')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:32,460][63771] DAMAGECOUNT value on done: 3470.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:32,460][63771] Sum rewards: -4.938, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.316', 'AMMO4': '-0.033', 'AMMO2': '-0.007', 'AMMO5': '0.005', 'weapon5': '0.008', 'ARMOR': '0.024', 'HITCOUNT': '0.060', 'WEAPON5': '0.100', 'AMMO3': '0.133', 'DAMAGECOUNT': '0.171', 'weapon2': '0.766', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '2.400'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:32,462][63576] Saving new best policy, reward=-4.221!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:32,725][63732] Updated weights for policy 0, policy_version 1230 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:32,771][63771] DAMAGECOUNT value on done: 5621.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:32,772][63771] Sum rewards: -4.839, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.130', 'AMMO5': '0.003', 'AMMO2': '0.025', 'ARMOR': '0.044', 'WEAPON5': '0.050', 'weapon4': '0.084', 'weapon5': '0.086', 'WEAPON4': '0.100', 'AMMO4': '0.123', 'AMMO3': '0.128', 'HITCOUNT': '0.200', 'DAMAGECOUNT': '0.660', 'WEAPON3': '0.900', 'weapon2': '1.524', 'weapon3': '1.864', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:34,660][63805] DAMAGECOUNT value on done: 6787.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:34,661][63805] Sum rewards: 2.588, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.062', 'AMMO4': '-0.012', 'AMMO2': '-0.002', 'weapon7': '0.002', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO3': '0.073', 'weapon5': '0.122', 'HITCOUNT': '0.190', 'WEAPON4': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.300', 'WEAPON3': '0.350', 'weapon4': '0.442', 'ARMOR': '0.519', 'DAMAGECOUNT': '0.861', 'weapon3': '1.058', 'weapon2': '1.662', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:34,999][63805] DAMAGECOUNT value on done: 5951.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:34,999][63805] Sum rewards: -4.068, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.448', 'AMMO5': '0.005', 'AMMO2': '0.015', 'WEAPON4': '0.050', 'AMMO4': '0.073', 'HITCOUNT': '0.080', 'weapon4': '0.104', 'AMMO3': '0.135', 'DAMAGECOUNT': '0.270', 'ARMOR': '0.472', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.488', 'weapon2': '1.738'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:35,424][63734] DAMAGECOUNT value on done: 6403.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:35,425][63734] Sum rewards: -4.329, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.240', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'weapon5': '0.048', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.056', 'HITCOUNT': '0.060', 'ARMOR': '0.062', 'AMMO3': '0.126', 'weapon4': '0.142', 'DAMAGECOUNT': '0.165', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.700', 'weapon3': '1.428', 'weapon2': '1.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:35,456][63767] DAMAGECOUNT value on done: 7616.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:35,456][63767] Sum rewards: -1.256, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.774', 'AMMO4': '-0.060', 'AMMO2': '-0.012', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'ARMOR': '0.020', 'AMMO3': '0.105', 'HITCOUNT': '0.180', 'weapon5': '0.224', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.570', 'WEAPON3': '0.700', 'weapon2': '1.316', 'weapon3': '1.954', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:35,816][63767] DAMAGECOUNT value on done: 7460.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:35,817][63767] Sum rewards: -2.475, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.332', 'FRAGCOUNT': '0.000', 'AMMO2': '0.003', 'AMMO5': '0.009', 'AMMO4': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.040', 'weapon5': '0.048', 'AMMO3': '0.166', 'WEAPON5': '0.200', 'HITCOUNT': '0.240', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.020', 'weapon2': '1.392', 'weapon3': '1.604'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:35,836][63734] DAMAGECOUNT value on done: 5326.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:35,837][63734] Sum rewards: 1.929, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.116', 'AMMO4': '-0.055', 'AMMO2': '-0.011', 'AMMO5': '0.007', 'WEAPON1': '0.030', 'AMMO3': '0.143', 'WEAPON5': '0.150', 'weapon5': '0.156', 'HITCOUNT': '0.190', 'ARMOR': '0.484', 'WEAPON3': '0.600', 'weapon2': '1.064', 'DAMAGECOUNT': '1.482', 'weapon3': '1.804', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:36,455][63771] DAMAGECOUNT value on done: 6728.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:36,456][63771] Sum rewards: -5.587, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.832', 'AMMO2': '0.002', 'AMMO4': '0.008', 'ARMOR': '0.020', 'AMMO5': '0.023', 'weapon5': '0.050', 'AMMO3': '0.174', 'WEAPON5': '0.200', 'HITCOUNT': '0.360', 'WEAPON3': '0.900', 'weapon2': '1.328', 'DAMAGECOUNT': '1.485', 'FRAGCOUNT': '1.500', 'weapon3': '2.196'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:36,852][63771] DAMAGECOUNT value on done: 4565.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:36,853][63771] Sum rewards: -5.582, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.318', 'AMMO2': '0.007', 'AMMO4': '0.033', 'ARMOR': '0.096', 'AMMO3': '0.139', 'HITCOUNT': '0.200', 'DAMAGECOUNT': '0.669', 'WEAPON3': '0.750', 'weapon2': '1.412', 'weapon3': '1.680', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:37,458][109198] Fps is (10 sec: 11059.2, 60 sec: 10922.7, 300 sec: 11121.7). Total num frames: 10051584. Throughput: 0: 1538.8, 1: 1199.9. Samples: 2506982. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:37,460][109198] Avg episode reward: [(0, '-2.539'), (1, '-4.228')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:39,297][63732] Updated weights for policy 0, policy_version 1240 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:39,521][63769] DAMAGECOUNT value on done: 4718.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:39,521][63769] Sum rewards: -1.361, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.020', 'AMMO2': '0.008', 'AMMO4': '0.038', 'ARMOR': '0.048', 'WEAPON4': '0.100', 'AMMO3': '0.124', 'weapon4': '0.140', 'HITCOUNT': '0.290', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.047', 'weapon3': '1.596', 'weapon2': '1.768', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:39,742][63733] Updated weights for policy 1, policy_version 1220 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:39,940][63769] DAMAGECOUNT value on done: 6409.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:39,941][63769] Sum rewards: -2.478, reward structure: {'DEATHCOUNT': '-10.500', 'AMMO5': '0.003', 'weapon5': '0.014', 'AMMO2': '0.024', 'WEAPON5': '0.050', 'HEALTH': '0.054', 'ARMOR': '0.112', 'AMMO4': '0.118', 'AMMO3': '0.134', 'HITCOUNT': '0.260', 'WEAPON4': '0.300', 'weapon4': '0.304', 'DAMAGECOUNT': '0.717', 'WEAPON3': '0.800', 'weapon2': '1.286', 'weapon3': '1.846', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:42,458][109198] Fps is (10 sec: 11059.3, 60 sec: 10922.7, 300 sec: 11107.8). Total num frames: 10104832. Throughput: 0: 1546.8, 1: 1205.8. Samples: 2523597. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:42,460][109198] Avg episode reward: [(0, '-2.577'), (1, '-4.253')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:42,703][63770] DAMAGECOUNT value on done: 6855.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:43,123][63770] DAMAGECOUNT value on done: 4003.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:43,123][63770] Sum rewards: -4.399, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.298', 'AMMO2': '0.001', 'AMMO4': '0.005', 'weapon5': '0.012', 'AMMO5': '0.017', 'AMMO3': '0.082', 'HITCOUNT': '0.110', 'WEAPON5': '0.250', 'ARMOR': '0.400', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.330', 'weapon2': '1.696'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:44,995][63735] DAMAGECOUNT value on done: 5627.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:45,371][63735] DAMAGECOUNT value on done: 5801.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:45,371][63735] Sum rewards: -6.165, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.701', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.010', 'AMMO5': '0.029', 'AMMO4': '0.048', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'AMMO3': '0.116', 'weapon5': '0.134', 'weapon4': '0.242', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.684', 'WEAPON3': '0.750', 'ARMOR': '0.949', 'weapon2': '1.236', 'weapon3': '1.748'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:45,380][63806] DAMAGECOUNT value on done: 5895.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:45,381][63806] Sum rewards: -2.325, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.212', 'AMMO2': '0.002', 'AMMO4': '0.007', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'AMMO5': '0.028', 'weapon5': '0.090', 'AMMO3': '0.138', 'HITCOUNT': '0.270', 'WEAPON5': '0.450', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.927', 'weapon2': '1.530', 'weapon3': '1.652', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:45,734][63806] DAMAGECOUNT value on done: 5782.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:45,734][63806] Sum rewards: -1.147, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.660', 'AMMO2': '0.012', 'weapon4': '0.016', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'AMMO4': '0.061', 'AMMO3': '0.099', 'WEAPON4': '0.100', 'HITCOUNT': '0.190', 'WEAPON5': '0.400', 'weapon5': '0.438', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.978', 'weapon3': '1.278', 'weapon2': '1.722', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:45,991][63732] Updated weights for policy 0, policy_version 1250 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:47,458][109198] Fps is (10 sec: 11059.2, 60 sec: 10990.9, 300 sec: 11107.8). Total num frames: 10162176. Throughput: 0: 1544.4, 1: 1204.0. Samples: 2531815. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:47,460][109198] Avg episode reward: [(0, '-2.573'), (1, '-4.243')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:48,128][63733] Updated weights for policy 1, policy_version 1230 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:48,887][63769] Large shaping reward -2.504 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.255, -85.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:49,210][63805] DAMAGECOUNT value on done: 7518.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:49,567][63805] DAMAGECOUNT value on done: 4510.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:49,568][63805] Sum rewards: -4.132, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.396', 'AMMO2': '0.001', 'AMMO4': '0.002', 'AMMO5': '0.005', 'ARMOR': '0.020', 'weapon5': '0.020', 'WEAPON5': '0.100', 'HITCOUNT': '0.120', 'AMMO3': '0.143', 'WEAPON4': '0.200', 'weapon4': '0.230', 'DAMAGECOUNT': '0.369', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.346', 'weapon2': '1.358'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:50,447][63735] DAMAGECOUNT value on done: 6217.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:50,448][63735] Sum rewards: -0.246, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.996', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.012', 'AMMO2': '0.026', 'AMMO4': '0.128', 'AMMO3': '0.133', 'weapon5': '0.176', 'WEAPON5': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon4': '0.270', 'HITCOUNT': '0.290', 'WEAPON4': '0.300', 'ARMOR': '0.492', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.915', 'weapon2': '1.126', 'weapon3': '1.832'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:50,863][63735] DAMAGECOUNT value on done: 3851.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:50,864][63735] Sum rewards: -3.702, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.578', 'AMMO5': '0.003', 'weapon5': '0.006', 'AMMO2': '0.011', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'WEAPON5': '0.050', 'AMMO4': '0.052', 'HITCOUNT': '0.140', 'AMMO3': '0.158', 'WEAPON4': '0.200', 'weapon4': '0.246', 'DAMAGECOUNT': '0.630', 'WEAPON3': '0.850', 'weapon3': '1.520', 'weapon2': '1.704', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:52,123][63734] DAMAGECOUNT value on done: 5480.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:52,123][63734] Sum rewards: 0.223, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.351', 'AMMO2': '0.008', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.040', 'weapon5': '0.060', 'ARMOR': '0.064', 'AMMO3': '0.194', 'WEAPON5': '0.200', 'HITCOUNT': '0.290', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.047', 'weapon2': '1.558', 'weapon3': '1.980', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:52,458][109198] Fps is (10 sec: 11059.1, 60 sec: 10990.9, 300 sec: 11107.8). Total num frames: 10215424. Throughput: 0: 1547.7, 1: 1205.1. Samples: 2548646. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:52,460][109198] Avg episode reward: [(0, '-2.440'), (1, '-4.305')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:52,482][63732] Updated weights for policy 0, policy_version 1260 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:52,517][63734] DAMAGECOUNT value on done: 4539.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:52,518][63734] Sum rewards: -5.045, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.908', 'AMMO5': '0.012', 'AMMO2': '0.023', 'ARMOR': '0.048', 'weapon5': '0.062', 'HITCOUNT': '0.080', 'WEAPON4': '0.100', 'AMMO4': '0.115', 'weapon4': '0.128', 'AMMO3': '0.162', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.375', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050', 'weapon2': '1.102', 'weapon3': '2.106'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:53,699][63806] DAMAGECOUNT value on done: 4683.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:53,780][63769] DAMAGECOUNT value on done: 6603.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:53,781][63769] Sum rewards: -0.750, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.768', 'AMMO2': '0.001', 'AMMO4': '0.002', 'AMMO5': '0.018', 'weapon7': '0.028', 'ARMOR': '0.032', 'AMMO3': '0.099', 'WEAPON4': '0.100', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'weapon5': '0.132', 'HITCOUNT': '0.150', 'weapon4': '0.206', 'WEAPON5': '0.300', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.615', 'weapon3': '1.402', 'weapon2': '1.532'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:53,785][63770] Large shaping reward -2.549 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.3, -100.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:54,064][63806] DAMAGECOUNT value on done: 7000.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:54,065][63806] Sum rewards: -3.537, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.032', 'AMMO2': '0.009', 'WEAPON1': '0.010', 'AMMO5': '0.022', 'AMMO4': '0.044', 'weapon5': '0.114', 'AMMO3': '0.128', 'HITCOUNT': '0.160', 'WEAPON4': '0.350', 'WEAPON5': '0.350', 'ARMOR': '0.512', 'weapon4': '0.524', 'DAMAGECOUNT': '0.678', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.416', 'weapon3': '1.478'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:54,110][63769] DAMAGECOUNT value on done: 4699.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:54,111][63769] Sum rewards: -0.150, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO5': '0.010', 'HEALTH': '0.016', 'AMMO2': '0.020', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'weapon7': '0.074', 'AMMO4': '0.099', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.116', 'WEAPON5': '0.150', 'weapon4': '0.150', 'HITCOUNT': '0.160', 'weapon5': '0.160', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.975', 'weapon3': '1.412', 'FRAGCOUNT': '1.500', 'weapon2': '1.568'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:54,119][63767] DAMAGECOUNT value on done: 6715.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:54,119][63767] Sum rewards: -3.646, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.670', 'AMMO5': '0.007', 'weapon5': '0.008', 'AMMO2': '0.010', 'WEAPON1': '0.020', 'ARMOR': '0.035', 'AMMO4': '0.052', 'AMMO3': '0.104', 'HITCOUNT': '0.110', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'weapon4': '0.284', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.586', 'weapon2': '1.632'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:54,155][63770] DAMAGECOUNT value on done: 5055.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:54,155][63770] Sum rewards: -4.760, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.844', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.011', 'AMMO5': '0.012', 'weapon5': '0.032', 'WEAPON4': '0.050', 'AMMO4': '0.056', 'AMMO3': '0.110', 'HITCOUNT': '0.150', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.741', 'WEAPON3': '0.750', 'weapon2': '1.666', 'weapon3': '1.756'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:54,464][63767] DAMAGECOUNT value on done: 6575.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:54,464][63767] Sum rewards: -5.443, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.912', 'AMMO2': '0.008', 'AMMO5': '0.010', 'AMMO4': '0.038', 'weapon5': '0.064', 'ARMOR': '0.068', 'AMMO3': '0.119', 'weapon4': '0.126', 'WEAPON4': '0.150', 'HITCOUNT': '0.170', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.516', 'WEAPON3': '0.850', 'weapon2': '1.430', 'weapon3': '1.470', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:54,569][63770] DAMAGECOUNT value on done: 5654.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:54,570][63770] Sum rewards: -2.362, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.940', 'AMMO4': '-0.042', 'AMMO2': '-0.008', 'AMMO5': '0.010', 'ARMOR': '0.015', 'weapon5': '0.076', 'weapon7': '0.104', 'HITCOUNT': '0.110', 'AMMO3': '0.141', 'WEAPON5': '0.200', 'AMMO6': '0.220', 'AMMO7': '0.220', 'WEAPON7': '0.300', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.020', 'weapon2': '1.200', 'FRAGCOUNT': '2.000', 'weapon3': '2.262'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:55,057][63771] DAMAGECOUNT value on done: 3480.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:55,440][63771] DAMAGECOUNT value on done: 5686.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:56,573][63733] Updated weights for policy 1, policy_version 1240 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:57,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11059.2, 300 sec: 11107.8). Total num frames: 10272768. Throughput: 0: 1551.0, 1: 1207.4. Samples: 2565227. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:51:57,460][109198] Avg episode reward: [(0, '-2.472'), (1, '-4.119')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:57,466][63576] Saving new best policy, reward=-4.119!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:58,825][63767] DAMAGECOUNT value on done: 7721.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:58,825][63767] Sum rewards: -3.001, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.972', 'AMMO2': '0.011', 'AMMO5': '0.018', 'WEAPON4': '0.050', 'AMMO4': '0.053', 'AMMO3': '0.108', 'HITCOUNT': '0.120', 'weapon5': '0.200', 'WEAPON5': '0.250', 'weapon4': '0.284', 'DAMAGECOUNT': '0.315', 'ARMOR': '0.528', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.074', 'weapon2': '1.610'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:59,089][63732] Updated weights for policy 0, policy_version 1270 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:59,190][63767] DAMAGECOUNT value on done: 7707.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:59,190][63767] Sum rewards: 1.112, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.036', 'AMMO5': '0.010', 'weapon4': '0.014', 'AMMO2': '0.016', 'weapon5': '0.018', 'WEAPON4': '0.050', 'AMMO4': '0.079', 'WEAPON5': '0.100', 'AMMO3': '0.124', 'HITCOUNT': '0.250', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.741', 'ARMOR': '0.876', 'weapon2': '1.364', 'weapon3': '2.206', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:59,594][63805] DAMAGECOUNT value on done: 7252.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:51:59,595][63805] Sum rewards: -2.611, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.505', 'AMMO4': '-0.029', 'AMMO2': '-0.006', 'AMMO5': '0.010', 'weapon7': '0.050', 'WEAPON4': '0.100', 'weapon5': '0.116', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon4': '0.134', 'WEAPON5': '0.150', 'AMMO3': '0.163', 'WEAPON7': '0.200', 'HITCOUNT': '0.340', 'ARMOR': '0.536', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.150', 'weapon2': '1.340', 'DAMAGECOUNT': '1.395', 'weapon3': '2.004'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:00,011][63805] DAMAGECOUNT value on done: 6275.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:00,011][63805] Sum rewards: 0.567, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO2': '0.007', 'AMMO5': '0.008', 'WEAPON1': '0.020', 'AMMO4': '0.035', 'HEALTH': '0.082', 'weapon5': '0.100', 'AMMO3': '0.111', 'WEAPON5': '0.150', 'HITCOUNT': '0.280', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.972', 'weapon2': '1.412', 'weapon3': '1.590', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:00,899][63734] DAMAGECOUNT value on done: 6601.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:00,899][63734] Sum rewards: -2.816, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.529', 'AMMO5': '0.005', 'weapon5': '0.014', 'AMMO2': '0.033', 'ARMOR': '0.064', 'AMMO3': '0.090', 'WEAPON5': '0.100', 'AMMO4': '0.163', 'HITCOUNT': '0.170', 'WEAPON4': '0.250', 'weapon4': '0.360', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.594', 'FRAGCOUNT': '1.000', 'weapon3': '1.018', 'weapon2': '1.702'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:01,328][63734] DAMAGECOUNT value on done: 5519.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:01,329][63734] Sum rewards: -3.512, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.000', 'weapon4': '0.002', 'AMMO2': '0.014', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'AMMO4': '0.070', 'AMMO3': '0.092', 'weapon5': '0.124', 'HITCOUNT': '0.190', 'WEAPON5': '0.250', 'HEALTH': '0.364', 'ARMOR': '0.480', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.579', 'weapon2': '1.062', 'weapon3': '1.874'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:01,550][63771] DAMAGECOUNT value on done: 6859.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:01,551][63771] Sum rewards: 1.729, reward structure: {'DEATHCOUNT': '-4.500', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.018', 'AMMO3': '0.050', 'AMMO4': '0.089', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'weapon7': '0.124', 'weapon5': '0.184', 'WEAPON3': '0.250', 'HEALTH': '0.268', 'DAMAGECOUNT': '0.393', 'ARMOR': '0.464', 'FRAGCOUNT': '1.000', 'weapon3': '1.260', 'weapon2': '1.604'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:01,981][63771] DAMAGECOUNT value on done: 4717.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:01,982][63771] Sum rewards: -5.476, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.036', 'AMMO5': '0.005', 'weapon5': '0.008', 'AMMO2': '0.010', 'WEAPON1': '0.020', 'ARMOR': '0.028', 'WEAPON5': '0.050', 'AMMO4': '0.050', 'AMMO3': '0.118', 'WEAPON4': '0.150', 'weapon4': '0.188', 'HITCOUNT': '0.200', 'DAMAGECOUNT': '0.456', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.472', 'weapon2': '1.654'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:02,458][109198] Fps is (10 sec: 10649.5, 60 sec: 10922.6, 300 sec: 11080.0). Total num frames: 10321920. Throughput: 0: 1551.4, 1: 1208.6. Samples: 2573255. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:02,460][109198] Avg episode reward: [(0, '-2.374'), (1, '-4.061')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:02,462][63576] Saving new best policy, reward=-4.061!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:04,789][63769] DAMAGECOUNT value on done: 5836.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:04,790][63769] Sum rewards: -1.796, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.666', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.010', 'AMMO5': '0.020', 'ARMOR': '0.044', 'AMMO4': '0.047', 'weapon7': '0.054', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.109', 'HITCOUNT': '0.200', 'weapon5': '0.204', 'WEAPON5': '0.350', 'WEAPON3': '0.700', 'weapon2': '1.342', 'weapon3': '1.636', 'DAMAGECOUNT': '1.854'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:05,186][63733] Updated weights for policy 1, policy_version 1250 (0.0013)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:05,218][63769] DAMAGECOUNT value on done: 6550.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:05,219][63769] Sum rewards: -1.741, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO5': '0.005', 'weapon5': '0.020', 'AMMO2': '0.028', 'ARMOR': '0.040', 'weapon4': '0.042', 'WEAPON4': '0.050', 'WEAPON5': '0.050', 'AMMO3': '0.061', 'AMMO4': '0.138', 'HITCOUNT': '0.170', 'WEAPON3': '0.350', 'DAMAGECOUNT': '0.423', 'HEALTH': '0.758', 'FRAGCOUNT': '1.000', 'weapon3': '1.200', 'weapon2': '2.174'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:05,701][63732] Updated weights for policy 0, policy_version 1280 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:07,458][109198] Fps is (10 sec: 10649.7, 60 sec: 10990.9, 300 sec: 11093.9). Total num frames: 10379264. Throughput: 0: 1548.1, 1: 1207.0. Samples: 2589737. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:07,460][109198] Avg episode reward: [(0, '-2.381'), (1, '-4.021')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:07,470][63576] Saving new best policy, reward=-4.021!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:08,146][63770] DAMAGECOUNT value on done: 7299.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:08,147][63770] Sum rewards: -0.156, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.490', 'AMMO4': '-0.042', 'AMMO2': '-0.008', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'weapon5': '0.046', 'weapon7': '0.066', 'AMMO3': '0.091', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON7': '0.200', 'weapon4': '0.236', 'HITCOUNT': '0.330', 'WEAPON3': '0.700', 'ARMOR': '0.928', 'FRAGCOUNT': '1.000', 'weapon2': '1.206', 'DAMAGECOUNT': '1.332', 'weapon3': '1.532'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:08,424][63806] DAMAGECOUNT value on done: 6037.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:08,425][63806] Sum rewards: -2.341, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.286', 'AMMO5': '0.015', 'AMMO2': '0.016', 'weapon5': '0.042', 'AMMO4': '0.081', 'AMMO3': '0.092', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'ARMOR': '0.108', 'HITCOUNT': '0.120', 'WEAPON5': '0.150', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.426', 'weapon4': '0.450', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.128', 'weapon3': '1.616'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:08,565][63770] DAMAGECOUNT value on done: 4160.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:08,739][63806] DAMAGECOUNT value on done: 5932.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:08,740][63806] Sum rewards: 1.867, reward structure: {'DEATHCOUNT': '-5.250', 'AMMO5': '0.003', 'AMMO2': '0.019', 'weapon5': '0.030', 'WEAPON5': '0.050', 'ARMOR': '0.064', 'AMMO3': '0.090', 'AMMO4': '0.095', 'HITCOUNT': '0.110', 'WEAPON3': '0.350', 'DAMAGECOUNT': '0.450', 'HEALTH': '0.516', 'weapon2': '1.564', 'weapon3': '1.776', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:09,773][63735] DAMAGECOUNT value on done: 6027.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:09,773][63735] Sum rewards: -3.133, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.051', 'AMMO2': '0.007', 'ARMOR': '0.032', 'AMMO4': '0.033', 'AMMO3': '0.130', 'WEAPON4': '0.150', 'HITCOUNT': '0.290', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.200', 'weapon2': '1.684', 'weapon3': '1.692', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:10,106][63735] DAMAGECOUNT value on done: 5856.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:10,106][63735] Sum rewards: 0.247, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.214', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.019', 'WEAPON5': '0.050', 'HITCOUNT': '0.050', 'weapon5': '0.060', 'AMMO3': '0.075', 'AMMO4': '0.094', 'ARMOR': '0.096', 'weapon7': '0.158', 'DAMAGECOUNT': '0.165', 'WEAPON4': '0.200', 'AMMO6': '0.300', 'WEAPON7': '0.300', 'AMMO7': '0.300', 'WEAPON3': '0.350', 'weapon4': '0.558', 'weapon3': '0.922', 'FRAGCOUNT': '1.000', 'weapon2': '1.752'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:12,237][63732] Updated weights for policy 0, policy_version 1290 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:12,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11059.2, 300 sec: 11080.0). Total num frames: 10436608. Throughput: 0: 1552.7, 1: 1199.4. Samples: 2606228. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:12,460][109198] Avg episode reward: [(0, '-2.270'), (1, '-4.047')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:13,922][63733] Updated weights for policy 1, policy_version 1260 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:14,326][63805] DAMAGECOUNT value on done: 7993.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:14,327][63805] Sum rewards: -2.789, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.766', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'ARMOR': '0.012', 'AMMO2': '0.015', 'weapon5': '0.040', 'AMMO4': '0.072', 'weapon4': '0.074', 'AMMO3': '0.131', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'HITCOUNT': '0.350', 'WEAPON3': '0.800', 'weapon2': '0.854', 'DAMAGECOUNT': '1.425', 'FRAGCOUNT': '2.000', 'weapon3': '2.534'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:14,753][63805] DAMAGECOUNT value on done: 4760.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:14,753][63805] Sum rewards: -3.452, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.086', 'AMMO2': '0.012', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'AMMO4': '0.060', 'weapon4': '0.108', 'AMMO3': '0.127', 'WEAPON4': '0.150', 'HITCOUNT': '0.170', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.750', 'weapon3': '1.666', 'weapon2': '1.788', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:15,446][63735] DAMAGECOUNT value on done: 6527.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:15,447][63735] Sum rewards: -1.432, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.280', 'AMMO2': '0.003', 'weapon4': '0.006', 'AMMO5': '0.010', 'ARMOR': '0.012', 'AMMO4': '0.017', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'weapon5': '0.110', 'AMMO3': '0.135', 'WEAPON5': '0.200', 'HITCOUNT': '0.230', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.930', 'weapon2': '1.160', 'FRAGCOUNT': '2.000', 'weapon3': '2.214'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:15,822][63734] DAMAGECOUNT value on done: 6065.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:15,823][63734] Sum rewards: 1.770, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.504', 'AMMO4': '-0.020', 'AMMO2': '-0.004', 'WEAPON1': '0.010', 'AMMO5': '0.020', 'weapon7': '0.072', 'AMMO3': '0.084', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon5': '0.172', 'weapon4': '0.196', 'WEAPON7': '0.200', 'HITCOUNT': '0.240', 'WEAPON5': '0.350', 'ARMOR': '0.449', 'WEAPON3': '0.650', 'weapon2': '1.446', 'weapon3': '1.564', 'DAMAGECOUNT': '1.755', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:15,828][63735] DAMAGECOUNT value on done: 4100.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:15,828][63735] Sum rewards: -1.161, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.060', 'AMMO2': '0.004', 'weapon4': '0.010', 'WEAPON1': '0.020', 'AMMO4': '0.021', 'ARMOR': '0.036', 'WEAPON4': '0.050', 'AMMO3': '0.113', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.747', 'WEAPON3': '0.750', 'weapon2': '1.708', 'weapon3': '1.730', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:16,219][63734] DAMAGECOUNT value on done: 4917.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:16,220][63734] Sum rewards: -1.574, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.792', 'AMMO2': '0.004', 'AMMO5': '0.017', 'AMMO4': '0.018', 'WEAPON1': '0.020', 'AMMO3': '0.113', 'WEAPON4': '0.200', 'HITCOUNT': '0.270', 'weapon5': '0.278', 'weapon4': '0.302', 'WEAPON5': '0.400', 'ARMOR': '0.484', 'WEAPON3': '0.750', 'weapon3': '1.060', 'DAMAGECOUNT': '1.134', 'weapon2': '1.418', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:16,557][63767] DAMAGECOUNT value on done: 6935.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:16,558][63767] Sum rewards: -3.600, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.773', 'AMMO2': '0.021', 'ARMOR': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.103', 'AMMO4': '0.103', 'HITCOUNT': '0.120', 'weapon4': '0.224', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.660', 'FRAGCOUNT': '1.000', 'weapon3': '1.286', 'weapon2': '1.956'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:16,947][63767] DAMAGECOUNT value on done: 6740.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:16,948][63767] Sum rewards: -2.769, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.104', 'AMMO5': '0.007', 'AMMO2': '0.014', 'ARMOR': '0.036', 'weapon5': '0.038', 'AMMO4': '0.072', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.122', 'HITCOUNT': '0.170', 'weapon4': '0.194', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.700', 'weapon3': '1.440', 'weapon2': '1.596', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:17,458][109198] Fps is (10 sec: 11059.2, 60 sec: 10991.0, 300 sec: 11080.0). Total num frames: 10489856. Throughput: 0: 1560.1, 1: 1195.4. Samples: 2614549. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:17,460][109198] Avg episode reward: [(0, '-2.274'), (1, '-3.891')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:17,466][63576] Saving new best policy, reward=-3.891!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:17,688][63769] DAMAGECOUNT value on done: 6851.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:17,689][63769] Sum rewards: -5.008, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.005', 'AMMO2': '0.012', 'AMMO5': '0.025', 'weapon5': '0.032', 'AMMO4': '0.059', 'ARMOR': '0.064', 'weapon7': '0.072', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.133', 'HITCOUNT': '0.160', 'WEAPON7': '0.200', 'WEAPON5': '0.350', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.744', 'WEAPON3': '0.850', 'weapon2': '1.324', 'weapon3': '1.982'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:18,065][63771] DAMAGECOUNT value on done: 3675.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:18,066][63771] Sum rewards: -5.281, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.638', 'AMMO5': '0.005', 'AMMO2': '0.007', 'weapon5': '0.012', 'AMMO4': '0.034', 'ARMOR': '0.066', 'AMMO3': '0.090', 'WEAPON5': '0.100', 'HITCOUNT': '0.160', 'WEAPON4': '0.250', 'weapon4': '0.320', 'DAMAGECOUNT': '0.585', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.390', 'weapon3': '1.488'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:18,090][63769] DAMAGECOUNT value on done: 4942.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:18,090][63769] Sum rewards: -2.890, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.090', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.012', 'AMMO2': '0.016', 'weapon5': '0.020', 'WEAPON4': '0.050', 'AMMO4': '0.077', 'weapon4': '0.098', 'AMMO3': '0.114', 'WEAPON5': '0.150', 'HITCOUNT': '0.250', 'ARMOR': '0.476', 'DAMAGECOUNT': '0.729', 'WEAPON3': '0.800', 'weapon2': '1.354', 'weapon3': '2.054'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:18,412][63771] DAMAGECOUNT value on done: 5963.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:18,412][63771] Sum rewards: -3.628, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.294', 'AMMO5': '0.005', 'AMMO2': '0.007', 'weapon5': '0.018', 'AMMO4': '0.033', 'ARMOR': '0.048', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.186', 'weapon4': '0.198', 'HITCOUNT': '0.250', 'DAMAGECOUNT': '0.831', 'WEAPON3': '0.900', 'weapon3': '1.608', 'weapon2': '1.632', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:18,422][63732] Updated weights for policy 0, policy_version 1300 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:18,514][63806] DAMAGECOUNT value on done: 4773.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:18,867][63806] DAMAGECOUNT value on done: 7374.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:18,867][63806] Sum rewards: 1.062, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.279', 'AMMO2': '0.009', 'AMMO5': '0.014', 'WEAPON1': '0.030', 'ARMOR': '0.040', 'AMMO4': '0.043', 'WEAPON4': '0.050', 'weapon4': '0.052', 'AMMO3': '0.126', 'weapon5': '0.228', 'HITCOUNT': '0.280', 'WEAPON5': '0.300', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.122', 'weapon2': '1.280', 'weapon3': '1.866', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:19,907][63770] DAMAGECOUNT value on done: 5318.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:20,251][63770] DAMAGECOUNT value on done: 5831.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:20,252][63770] Sum rewards: -10.862, reward structure: {'DEATHCOUNT': '-13.500', 'FRAGCOUNT': '-3.000', 'HEALTH': '-1.074', 'AMMO5': '0.014', 'AMMO2': '0.020', 'ARMOR': '0.032', 'weapon5': '0.096', 'WEAPON4': '0.100', 'AMMO4': '0.101', 'HITCOUNT': '0.140', 'weapon4': '0.146', 'AMMO3': '0.199', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.531', 'WEAPON3': '1.050', 'weapon2': '1.670', 'weapon3': '1.712'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:22,330][63767] DAMAGECOUNT value on done: 8005.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:22,331][63767] Sum rewards: 1.065, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.086', 'AMMO5': '0.007', 'AMMO2': '0.013', 'weapon5': '0.030', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'weapon4': '0.056', 'AMMO4': '0.066', 'AMMO3': '0.142', 'WEAPON5': '0.150', 'HITCOUNT': '0.210', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.852', 'weapon3': '1.730', 'weapon2': '1.862', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:22,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11059.2, 300 sec: 11080.0). Total num frames: 10547200. Throughput: 0: 1575.4, 1: 1186.3. Samples: 2631256. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:22,460][109198] Avg episode reward: [(0, '-2.358'), (1, '-3.929')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:22,750][63767] DAMAGECOUNT value on done: 7825.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:23,126][63733] Updated weights for policy 1, policy_version 1270 (0.0013)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:24,696][63732] Updated weights for policy 0, policy_version 1310 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:24,748][63805] DAMAGECOUNT value on done: 7365.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:25,132][63805] DAMAGECOUNT value on done: 6591.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:25,133][63805] Sum rewards: -2.989, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.152', 'AMMO2': '0.011', 'AMMO5': '0.012', 'AMMO4': '0.055', 'AMMO3': '0.071', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'weapon4': '0.186', 'WEAPON5': '0.200', 'weapon5': '0.226', 'WEAPON3': '0.500', 'weapon3': '0.882', 'DAMAGECOUNT': '0.948', 'FRAGCOUNT': '1.500', 'weapon2': '1.772'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:26,084][63734] DAMAGECOUNT value on done: 6831.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:26,084][63734] Sum rewards: -1.565, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.712', 'AMMO2': '0.001', 'AMMO4': '0.006', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'weapon5': '0.024', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'weapon4': '0.054', 'AMMO3': '0.089', 'HITCOUNT': '0.140', 'WEAPON5': '0.250', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.690', 'weapon3': '1.284', 'weapon2': '1.936', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:26,472][63734] DAMAGECOUNT value on done: 5814.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:26,472][63734] Sum rewards: -6.395, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.290', 'FRAGCOUNT': '-0.500', 'weapon4': '0.010', 'AMMO5': '0.015', 'WEAPON1': '0.030', 'AMMO2': '0.030', 'AMMO3': '0.138', 'WEAPON4': '0.150', 'AMMO4': '0.151', 'weapon5': '0.156', 'HITCOUNT': '0.230', 'WEAPON5': '0.350', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.885', 'weapon2': '1.138', 'weapon3': '1.762'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:26,783][63771] DAMAGECOUNT value on done: 7324.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:26,783][63771] Sum rewards: -2.841, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.886', 'AMMO2': '0.009', 'weapon7': '0.038', 'AMMO4': '0.045', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.167', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'weapon4': '0.258', 'HITCOUNT': '0.350', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.395', 'weapon2': '1.496', 'weapon3': '1.796', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:27,186][63771] DAMAGECOUNT value on done: 4877.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:27,186][63771] Sum rewards: -2.762, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.860', 'AMMO5': '0.005', 'AMMO2': '0.008', 'WEAPON1': '0.020', 'AMMO4': '0.040', 'weapon5': '0.052', 'ARMOR': '0.060', 'WEAPON5': '0.100', 'AMMO3': '0.119', 'HITCOUNT': '0.160', 'DAMAGECOUNT': '0.480', 'WEAPON3': '0.800', 'weapon2': '1.498', 'weapon3': '1.756', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:27,458][109198] Fps is (10 sec: 11059.2, 60 sec: 10990.9, 300 sec: 11080.0). Total num frames: 10600448. Throughput: 0: 1590.1, 1: 1169.0. Samples: 2647759. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:27,460][109198] Avg episode reward: [(0, '-2.366'), (1, '-3.822')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:27,467][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001274_5218304.pth...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:27,467][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001314_5382144.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:27,528][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000989_4050944.pth\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:27,529][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000952_3899392.pth\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:27,536][63576] Saving new best policy, reward=-3.822!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:30,141][63769] DAMAGECOUNT value on done: 6036.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:30,142][63769] Sum rewards: -1.098, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.040', 'AMMO4': '-0.041', 'AMMO2': '-0.008', 'AMMO5': '0.005', 'weapon5': '0.042', 'ARMOR': '0.096', 'WEAPON5': '0.100', 'AMMO3': '0.110', 'HITCOUNT': '0.170', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.600', 'weapon2': '1.364', 'weapon3': '1.404', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:30,469][63769] DAMAGECOUNT value on done: 6695.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:30,470][63769] Sum rewards: -3.110, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.730', 'AMMO2': '0.018', 'weapon4': '0.040', 'WEAPON4': '0.050', 'AMMO3': '0.073', 'HITCOUNT': '0.090', 'AMMO4': '0.091', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.435', 'weapon3': '1.242', 'FRAGCOUNT': '2.000', 'weapon2': '2.280'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:30,625][63732] Updated weights for policy 0, policy_version 1320 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:31,579][63806] DAMAGECOUNT value on done: 6207.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:31,580][63806] Sum rewards: -0.667, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO2': '0.004', 'AMMO5': '0.017', 'AMMO4': '0.018', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'HEALTH': '0.116', 'HITCOUNT': '0.130', 'AMMO3': '0.136', 'WEAPON5': '0.250', 'weapon5': '0.284', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.510', 'ARMOR': '0.510', 'WEAPON3': '0.700', 'weapon3': '1.402', 'weapon2': '1.956'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:31,994][63806] DAMAGECOUNT value on done: 6127.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:31,994][63806] Sum rewards: -7.716, reward structure: {'DEATHCOUNT': '-10.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.229', 'AMMO2': '0.003', 'AMMO4': '0.014', 'AMMO5': '0.018', 'WEAPON4': '0.050', 'ARMOR': '0.060', 'AMMO3': '0.156', 'HITCOUNT': '0.190', 'weapon4': '0.222', 'weapon5': '0.240', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.585', 'WEAPON3': '0.800', 'weapon2': '1.096', 'weapon3': '1.830'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:32,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11059.2, 300 sec: 11093.9). Total num frames: 10657792. Throughput: 0: 1602.6, 1: 1159.8. Samples: 2656120. Policy #0 lag: (min: 0.0, avg: 0.4, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:32,460][109198] Avg episode reward: [(0, '-2.355'), (1, '-3.805')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:32,462][63576] Saving new best policy, reward=-3.805!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:32,635][63733] Updated weights for policy 1, policy_version 1280 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:33,303][63735] DAMAGECOUNT value on done: 6523.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:33,303][63735] Sum rewards: -5.791, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-3.432', 'AMMO4': '-0.012', 'AMMO2': '-0.002', 'AMMO5': '0.016', 'WEAPON1': '0.020', 'weapon7': '0.022', 'ARMOR': '0.052', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.191', 'HITCOUNT': '0.200', 'weapon5': '0.216', 'WEAPON5': '0.400', 'WEAPON3': '0.950', 'weapon3': '1.278', 'DAMAGECOUNT': '1.488', 'weapon2': '2.022', 'FRAGCOUNT': '2.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:33,446][63770] DAMAGECOUNT value on done: 7471.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:33,447][63770] Sum rewards: -6.407, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.520', 'AMMO2': '0.001', 'AMMO4': '0.006', 'AMMO5': '0.015', 'ARMOR': '0.020', 'WEAPON1': '0.030', 'weapon4': '0.034', 'WEAPON4': '0.050', 'weapon5': '0.076', 'weapon7': '0.080', 'HITCOUNT': '0.170', 'AMMO3': '0.195', 'WEAPON7': '0.200', 'AMMO6': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.516', 'WEAPON3': '1.050', 'weapon2': '1.404', 'FRAGCOUNT': '1.500', 'weapon3': '1.866'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:33,674][63735] DAMAGECOUNT value on done: 6121.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:33,675][63735] Sum rewards: 0.537, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.520', 'AMMO2': '0.001', 'AMMO4': '0.005', 'AMMO5': '0.012', 'ARMOR': '0.036', 'AMMO3': '0.100', 'weapon5': '0.172', 'HITCOUNT': '0.270', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.795', 'weapon2': '1.022', 'weapon3': '2.244', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:33,839][63770] DAMAGECOUNT value on done: 4445.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:33,839][63770] Sum rewards: -2.303, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.073', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.016', 'weapon5': '0.022', 'WEAPON4': '0.050', 'AMMO4': '0.082', 'WEAPON5': '0.100', 'AMMO3': '0.110', 'HITCOUNT': '0.130', 'weapon4': '0.180', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.855', 'FRAGCOUNT': '1.000', 'weapon3': '1.450', 'weapon2': '1.710'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:36,576][63732] Updated weights for policy 0, policy_version 1330 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:37,458][109198] Fps is (10 sec: 11059.1, 60 sec: 10990.9, 300 sec: 11066.1). Total num frames: 10711040. Throughput: 0: 1621.8, 1: 1136.5. Samples: 2672769. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:37,460][109198] Avg episode reward: [(0, '-2.388'), (1, '-3.768')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:37,528][63576] Saving new best policy, reward=-3.768!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:38,916][63767] DAMAGECOUNT value on done: 7107.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:39,192][63735] Large shaping reward -2.504 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.255, -85.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:39,263][63767] DAMAGECOUNT value on done: 6950.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:39,264][63767] Sum rewards: -3.959, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.825', 'AMMO4': '-0.045', 'AMMO2': '-0.009', 'weapon5': '0.008', 'AMMO5': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.056', 'AMMO3': '0.073', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'HITCOUNT': '0.190', 'weapon4': '0.208', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.630', 'weapon3': '1.170', 'weapon2': '1.750'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:39,391][63805] DAMAGECOUNT value on done: 8493.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:39,392][63805] Sum rewards: -3.169, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.408', 'AMMO2': '0.006', 'AMMO5': '0.018', 'AMMO4': '0.031', 'AMMO3': '0.185', 'weapon5': '0.228', 'HITCOUNT': '0.390', 'WEAPON5': '0.400', 'weapon2': '1.064', 'WEAPON3': '1.100', 'DAMAGECOUNT': '1.500', 'weapon3': '2.316', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:39,806][63734] DAMAGECOUNT value on done: 6360.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:39,807][63734] Sum rewards: -3.445, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.478', 'AMMO2': '0.010', 'AMMO5': '0.028', 'ARMOR': '0.028', 'weapon4': '0.042', 'AMMO4': '0.049', 'WEAPON1': '0.050', 'weapon5': '0.090', 'WEAPON4': '0.100', 'AMMO3': '0.165', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.230', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.885', 'WEAPON3': '1.000', 'weapon2': '1.366', 'weapon3': '1.990', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:39,820][63805] DAMAGECOUNT value on done: 5045.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:39,820][63805] Sum rewards: -1.205, reward structure: {'DEATHCOUNT': '-9.000', 'AMMO5': '0.010', 'weapon5': '0.012', 'AMMO2': '0.013', 'HEALTH': '0.018', 'AMMO4': '0.066', 'WEAPON4': '0.100', 'AMMO3': '0.103', 'weapon4': '0.112', 'WEAPON5': '0.200', 'HITCOUNT': '0.210', 'ARMOR': '0.493', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.855', 'weapon3': '1.506', 'weapon2': '1.546', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:40,192][63734] DAMAGECOUNT value on done: 5119.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:40,193][63734] Sum rewards: -3.586, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.478', 'AMMO5': '0.005', 'AMMO2': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.062', 'AMMO3': '0.121', 'weapon5': '0.138', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.606', 'WEAPON3': '0.750', 'ARMOR': '0.846', 'FRAGCOUNT': '1.500', 'weapon3': '1.544', 'weapon2': '1.718'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:40,234][63735] DAMAGECOUNT value on done: 7242.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:40,235][63735] Sum rewards: -1.419, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.926', 'AMMO5': '0.010', 'AMMO2': '0.028', 'ARMOR': '0.040', 'WEAPON1': '0.040', 'weapon4': '0.050', 'AMMO4': '0.140', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'weapon5': '0.152', 'AMMO3': '0.157', 'HITCOUNT': '0.410', 'WEAPON3': '0.850', 'weapon2': '1.696', 'weapon3': '1.738', 'DAMAGECOUNT': '2.145', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:40,537][63771] DAMAGECOUNT value on done: 3930.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:40,596][63735] DAMAGECOUNT value on done: 4188.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:40,596][63735] Sum rewards: -2.707, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.851', 'AMMO5': '0.007', 'AMMO2': '0.018', 'ARMOR': '0.032', 'AMMO3': '0.066', 'AMMO4': '0.089', 'HITCOUNT': '0.110', 'weapon5': '0.124', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.264', 'weapon4': '0.354', 'WEAPON3': '0.450', 'FRAGCOUNT': '0.500', 'weapon3': '1.186', 'weapon2': '1.394'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:40,932][63771] DAMAGECOUNT value on done: 6308.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:40,933][63771] Sum rewards: -3.789, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.175', 'WEAPON1': '0.020', 'AMMO2': '0.039', 'ARMOR': '0.052', 'WEAPON4': '0.100', 'AMMO3': '0.151', 'AMMO4': '0.193', 'weapon4': '0.210', 'HITCOUNT': '0.250', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.035', 'weapon3': '1.576', 'weapon2': '1.710'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:41,660][63769] DAMAGECOUNT value on done: 7310.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:41,660][63769] Sum rewards: 0.655, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.300', 'AMMO2': '0.006', 'ARMOR': '0.008', 'WEAPON1': '0.020', 'AMMO5': '0.025', 'AMMO4': '0.031', 'weapon7': '0.058', 'AMMO3': '0.073', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON7': '0.200', 'weapon5': '0.218', 'HITCOUNT': '0.280', 'weapon4': '0.326', 'WEAPON5': '0.400', 'WEAPON3': '0.500', 'weapon2': '0.702', 'weapon3': '1.140', 'DAMAGECOUNT': '1.377', 'FRAGCOUNT': '1.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:42,048][63769] DAMAGECOUNT value on done: 5445.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:42,049][63769] Sum rewards: 2.934, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.380', 'ARMOR': '0.008', 'AMMO2': '0.011', 'AMMO5': '0.013', 'AMMO4': '0.053', 'AMMO3': '0.096', 'weapon5': '0.176', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'weapon4': '0.336', 'WEAPON3': '0.550', 'weapon2': '1.270', 'DAMAGECOUNT': '1.509', 'weapon3': '1.622', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:42,459][109198] Fps is (10 sec: 10649.4, 60 sec: 10990.9, 300 sec: 11066.1). Total num frames: 10764288. Throughput: 0: 1645.4, 1: 1113.7. Samples: 2689390. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:42,461][109198] Avg episode reward: [(0, '-2.423'), (1, '-3.711')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:42,474][63576] Saving new best policy, reward=-3.711!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:42,478][63732] Updated weights for policy 0, policy_version 1340 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:42,480][63733] Updated weights for policy 1, policy_version 1290 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:42,524][63735] Large shaping reward -2.534 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.28500000000000003, -95.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:43,269][63806] DAMAGECOUNT value on done: 4828.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:43,701][63806] DAMAGECOUNT value on done: 7869.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:43,701][63806] Sum rewards: -0.760, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.719', 'AMMO2': '0.006', 'AMMO5': '0.010', 'AMMO4': '0.031', 'WEAPON4': '0.050', 'ARMOR': '0.059', 'weapon4': '0.076', 'WEAPON5': '0.100', 'AMMO3': '0.132', 'weapon5': '0.168', 'HITCOUNT': '0.360', 'WEAPON3': '0.900', 'weapon2': '0.914', 'DAMAGECOUNT': '1.485', 'FRAGCOUNT': '1.500', 'weapon3': '2.418'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:45,074][63770] DAMAGECOUNT value on done: 5574.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:45,075][63770] Sum rewards: -1.853, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.678', 'AMMO4': '-0.004', 'AMMO2': '-0.001', 'AMMO5': '0.003', 'ARMOR': '0.020', 'WEAPON5': '0.050', 'AMMO3': '0.105', 'weapon5': '0.116', 'HITCOUNT': '0.190', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.768', 'FRAGCOUNT': '1.000', 'weapon3': '1.280', 'weapon2': '1.448'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:45,441][63770] DAMAGECOUNT value on done: 6403.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:45,441][63770] Sum rewards: 2.498, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.640', 'AMMO2': '0.005', 'AMMO5': '0.016', 'WEAPON1': '0.020', 'AMMO4': '0.025', 'AMMO3': '0.117', 'WEAPON4': '0.200', 'weapon4': '0.262', 'WEAPON5': '0.300', 'HITCOUNT': '0.360', 'weapon5': '0.372', 'ARMOR': '0.516', 'WEAPON3': '0.600', 'weapon3': '1.318', 'weapon2': '1.560', 'DAMAGECOUNT': '1.716', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:45,540][63767] DAMAGECOUNT value on done: 8259.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:45,541][63767] Sum rewards: -1.651, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.528', 'AMMO2': '0.010', 'AMMO5': '0.021', 'AMMO4': '0.050', 'ARMOR': '0.088', 'WEAPON4': '0.100', 'AMMO3': '0.149', 'HITCOUNT': '0.150', 'weapon5': '0.162', 'weapon4': '0.302', 'WEAPON5': '0.350', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.762', 'weapon2': '1.432', 'weapon3': '1.600', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:45,920][63767] DAMAGECOUNT value on done: 8199.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:45,921][63767] Sum rewards: -4.952, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-2.000', 'HEALTH': '-0.018', 'WEAPON1': '0.010', 'AMMO2': '0.016', 'AMMO5': '0.020', 'ARMOR': '0.024', 'AMMO4': '0.082', 'AMMO3': '0.122', 'HITCOUNT': '0.140', 'weapon5': '0.160', 'WEAPON5': '0.350', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.122', 'weapon2': '1.498', 'weapon3': '1.822'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:47,458][109198] Fps is (10 sec: 11059.3, 60 sec: 10990.9, 300 sec: 11066.1). Total num frames: 10821632. Throughput: 0: 1655.0, 1: 1114.4. Samples: 2697876. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:47,460][109198] Avg episode reward: [(0, '-2.461'), (1, '-3.647')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:47,467][63576] Saving new best policy, reward=-3.647!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:48,456][63805] DAMAGECOUNT value on done: 7896.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:48,457][63805] Sum rewards: -0.949, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.192', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'weapon4': '0.020', 'AMMO2': '0.020', 'ARMOR': '0.048', 'weapon5': '0.088', 'WEAPON4': '0.100', 'AMMO4': '0.101', 'AMMO3': '0.116', 'WEAPON5': '0.250', 'HITCOUNT': '0.310', 'WEAPON3': '0.650', 'weapon3': '1.568', 'DAMAGECOUNT': '1.593', 'weapon2': '1.846', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:48,804][63805] DAMAGECOUNT value on done: 6929.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:48,804][63805] Sum rewards: 1.751, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.226', 'AMMO4': '-0.043', 'AMMO2': '-0.009', 'AMMO5': '0.009', 'WEAPON1': '0.010', 'ARMOR': '0.016', 'weapon5': '0.074', 'AMMO3': '0.114', 'weapon7': '0.136', 'HITCOUNT': '0.170', 'WEAPON5': '0.200', 'AMMO6': '0.240', 'AMMO7': '0.240', 'WEAPON7': '0.400', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.014', 'weapon2': '1.274', 'weapon3': '1.982', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:48,929][63732] Updated weights for policy 0, policy_version 1350 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:50,916][63733] Updated weights for policy 1, policy_version 1300 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:51,450][63734] DAMAGECOUNT value on done: 7189.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:51,450][63734] Sum rewards: -4.637, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.520', 'AMMO4': '-0.031', 'AMMO2': '-0.006', 'AMMO5': '0.003', 'ARMOR': '0.040', 'weapon5': '0.060', 'WEAPON5': '0.100', 'AMMO3': '0.115', 'HITCOUNT': '0.200', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.074', 'weapon3': '1.470', 'weapon2': '1.858'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:51,895][63734] DAMAGECOUNT value on done: 6199.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:51,896][63734] Sum rewards: -6.061, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.959', 'AMMO4': '-0.018', 'AMMO2': '-0.004', 'AMMO5': '0.008', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'WEAPON4': '0.050', 'weapon5': '0.062', 'weapon4': '0.080', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON5': '0.150', 'AMMO3': '0.177', 'HITCOUNT': '0.320', 'WEAPON3': '1.000', 'DAMAGECOUNT': '1.155', 'weapon3': '1.504', 'weapon2': '1.808', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:51,906][63771] DAMAGECOUNT value on done: 7559.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:51,907][63771] Sum rewards: -3.501, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.990', 'AMMO2': '0.004', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO4': '0.018', 'weapon5': '0.046', 'AMMO3': '0.146', 'WEAPON5': '0.200', 'HITCOUNT': '0.210', 'ARMOR': '0.424', 'DAMAGECOUNT': '0.705', 'WEAPON3': '0.900', 'weapon2': '1.090', 'FRAGCOUNT': '2.000', 'weapon3': '2.226'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:52,240][63771] DAMAGECOUNT value on done: 5111.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:52,241][63771] Sum rewards: -3.077, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.575', 'AMMO2': '0.002', 'AMMO4': '0.008', 'AMMO5': '0.009', 'ARMOR': '0.016', 'WEAPON1': '0.020', 'AMMO3': '0.075', 'weapon5': '0.112', 'HITCOUNT': '0.140', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'weapon4': '0.230', 'WEAPON3': '0.400', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.702', 'weapon3': '0.972', 'weapon2': '1.712'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:52,458][109198] Fps is (10 sec: 11469.1, 60 sec: 11059.2, 300 sec: 11080.0). Total num frames: 10878976. Throughput: 0: 1657.4, 1: 1116.9. Samples: 2714581. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:52,459][109198] Avg episode reward: [(0, '-2.423'), (1, '-3.660')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:54,989][63806] DAMAGECOUNT value on done: 6675.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:54,990][63806] Sum rewards: -4.429, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.106', 'AMMO4': '-0.034', 'AMMO2': '-0.007', 'AMMO5': '0.017', 'ARMOR': '0.020', 'weapon5': '0.176', 'AMMO3': '0.184', 'WEAPON5': '0.350', 'HITCOUNT': '0.400', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.404', 'weapon2': '1.540', 'weapon3': '1.776'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:55,328][63806] DAMAGECOUNT value on done: 6257.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:55,328][63806] Sum rewards: -1.617, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.848', 'AMMO5': '0.015', 'weapon5': '0.028', 'AMMO2': '0.039', 'HITCOUNT': '0.120', 'AMMO3': '0.143', 'AMMO4': '0.193', 'WEAPON4': '0.200', 'weapon4': '0.222', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.390', 'ARMOR': '0.400', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.024', 'weapon3': '1.858'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:55,358][63769] DAMAGECOUNT value on done: 6185.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:55,359][63769] Sum rewards: -3.608, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.180', 'AMMO2': '0.002', 'AMMO4': '0.008', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'weapon5': '0.072', 'AMMO3': '0.106', 'HITCOUNT': '0.140', 'weapon7': '0.180', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.376', 'AMMO6': '0.420', 'AMMO7': '0.420', 'DAMAGECOUNT': '0.447', 'WEAPON7': '0.500', 'WEAPON3': '0.600', 'weapon3': '0.894', 'weapon2': '1.592', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:55,613][63732] Updated weights for policy 0, policy_version 1360 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:55,844][63769] DAMAGECOUNT value on done: 6807.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:56,676][63735] DAMAGECOUNT value on done: 7000.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:56,676][63735] Sum rewards: -6.758, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-0.684', 'FRAGCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.014', 'AMMO4': '0.022', 'ARMOR': '0.028', 'AMMO3': '0.170', 'weapon5': '0.260', 'WEAPON5': '0.300', 'HITCOUNT': '0.370', 'WEAPON3': '0.800', 'weapon2': '1.344', 'DAMAGECOUNT': '1.431', 'weapon3': '1.932'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:57,041][63735] DAMAGECOUNT value on done: 6906.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:57,042][63735] Sum rewards: 0.212, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.716', 'AMMO2': '0.010', 'AMMO5': '0.022', 'WEAPON1': '0.030', 'AMMO4': '0.049', 'AMMO3': '0.182', 'weapon5': '0.292', 'HITCOUNT': '0.370', 'WEAPON5': '0.450', 'WEAPON3': '1.000', 'weapon2': '1.156', 'weapon3': '2.012', 'DAMAGECOUNT': '2.355', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:57,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11059.2, 300 sec: 11080.0). Total num frames: 10936320. Throughput: 0: 1645.1, 1: 1136.3. Samples: 2731389. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:52:57,460][109198] Avg episode reward: [(0, '-2.502'), (1, '-3.677')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:58,785][63733] Updated weights for policy 1, policy_version 1310 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:58,875][63770] DAMAGECOUNT value on done: 7617.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:59,284][63770] DAMAGECOUNT value on done: 4627.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:52:59,284][63770] Sum rewards: -0.023, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.572', 'AMMO2': '0.007', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'weapon4': '0.012', 'AMMO4': '0.037', 'WEAPON4': '0.050', 'weapon5': '0.074', 'AMMO3': '0.132', 'HITCOUNT': '0.170', 'WEAPON5': '0.200', 'ARMOR': '0.445', 'DAMAGECOUNT': '0.546', 'WEAPON3': '0.700', 'weapon3': '1.502', 'weapon2': '1.904', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:01,310][63767] DAMAGECOUNT value on done: 7237.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:01,311][63767] Sum rewards: -5.067, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.000', 'HEALTH': '-0.340', 'AMMO5': '0.005', 'AMMO2': '0.018', 'WEAPON1': '0.030', 'AMMO4': '0.088', 'AMMO3': '0.088', 'WEAPON5': '0.100', 'HITCOUNT': '0.130', 'weapon5': '0.244', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.450', 'weapon3': '1.092', 'weapon2': '1.888'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:01,653][63767] DAMAGECOUNT value on done: 7025.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:01,653][63767] Sum rewards: -7.776, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.972', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.007', 'AMMO2': '0.018', 'WEAPON1': '0.030', 'AMMO3': '0.059', 'HITCOUNT': '0.060', 'AMMO4': '0.089', 'weapon5': '0.130', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'weapon4': '0.160', 'DAMAGECOUNT': '0.225', 'ARMOR': '0.432', 'WEAPON3': '0.450', 'weapon3': '0.834', 'weapon2': '1.902'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:02,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11127.5, 300 sec: 11066.1). Total num frames: 10989568. Throughput: 0: 1637.0, 1: 1149.5. Samples: 2739941. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:02,460][109198] Avg episode reward: [(0, '-2.591'), (1, '-3.754')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:02,485][63732] Updated weights for policy 0, policy_version 1370 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:04,172][63771] DAMAGECOUNT value on done: 4148.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:04,173][63771] Sum rewards: -0.235, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.062', 'AMMO5': '0.014', 'ARMOR': '0.028', 'AMMO2': '0.028', 'WEAPON4': '0.100', 'weapon5': '0.126', 'AMMO3': '0.130', 'AMMO4': '0.140', 'HITCOUNT': '0.230', 'WEAPON5': '0.300', 'weapon4': '0.392', 'DAMAGECOUNT': '0.654', 'WEAPON3': '0.750', 'weapon2': '1.138', 'weapon3': '1.796', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:04,187][63805] DAMAGECOUNT value on done: 8717.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:04,188][63805] Sum rewards: -3.777, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.807', 'AMMO5': '0.010', 'AMMO2': '0.024', 'AMMO4': '0.117', 'HITCOUNT': '0.140', 'AMMO3': '0.151', 'weapon5': '0.222', 'WEAPON5': '0.250', 'WEAPON4': '0.300', 'weapon4': '0.308', 'ARMOR': '0.444', 'DAMAGECOUNT': '0.672', 'WEAPON3': '0.800', 'weapon2': '0.962', 'FRAGCOUNT': '1.000', 'weapon3': '1.630'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:04,578][63771] DAMAGECOUNT value on done: 6546.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:04,579][63771] Sum rewards: -2.509, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.001', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO2': '0.018', 'ARMOR': '0.064', 'AMMO4': '0.092', 'WEAPON4': '0.100', 'weapon4': '0.138', 'AMMO3': '0.158', 'HITCOUNT': '0.180', 'weapon5': '0.190', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.714', 'FRAGCOUNT': '1.500', 'weapon2': '1.568', 'weapon3': '1.598'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:04,580][63805] DAMAGECOUNT value on done: 5145.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:04,580][63805] Sum rewards: -2.819, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.418', 'AMMO5': '0.005', 'AMMO2': '0.008', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'AMMO4': '0.039', 'weapon5': '0.062', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.107', 'HITCOUNT': '0.120', 'weapon4': '0.162', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.522', 'weapon3': '1.568'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:04,808][63735] DAMAGECOUNT value on done: 7317.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:04,809][63735] Sum rewards: -5.088, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.876', 'AMMO5': '0.017', 'AMMO2': '0.018', 'HITCOUNT': '0.070', 'AMMO4': '0.087', 'AMMO3': '0.112', 'weapon5': '0.176', 'DAMAGECOUNT': '0.225', 'WEAPON4': '0.250', 'WEAPON5': '0.300', 'weapon4': '0.306', 'ARMOR': '0.436', 'WEAPON3': '0.600', 'weapon2': '1.346', 'weapon3': '1.594'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:04,861][63769] DAMAGECOUNT value on done: 7626.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:04,862][63769] Sum rewards: -7.164, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-2.344', 'AMMO5': '0.005', 'weapon5': '0.006', 'AMMO2': '0.012', 'ARMOR': '0.020', 'WEAPON1': '0.040', 'weapon4': '0.044', 'AMMO4': '0.059', 'WEAPON5': '0.100', 'WEAPON4': '0.150', 'AMMO3': '0.230', 'HITCOUNT': '0.290', 'DAMAGECOUNT': '0.948', 'WEAPON3': '1.250', 'weapon2': '1.368', 'FRAGCOUNT': '2.000', 'weapon3': '2.158'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:05,199][63735] DAMAGECOUNT value on done: 4378.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:05,200][63735] Sum rewards: -1.677, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.332', 'AMMO2': '0.006', 'AMMO5': '0.013', 'AMMO4': '0.030', 'WEAPON4': '0.050', 'weapon4': '0.090', 'HITCOUNT': '0.130', 'AMMO3': '0.138', 'weapon5': '0.194', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.570', 'WEAPON3': '0.850', 'weapon2': '1.348', 'weapon3': '1.986', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:05,219][63734] DAMAGECOUNT value on done: 6576.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:05,220][63734] Sum rewards: -1.208, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.076', 'AMMO5': '0.003', 'AMMO2': '0.006', 'ARMOR': '0.020', 'AMMO4': '0.029', 'WEAPON5': '0.050', 'weapon7': '0.066', 'AMMO3': '0.069', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'HITCOUNT': '0.170', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.648', 'weapon3': '0.890', 'weapon2': '1.668', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:05,248][63769] DAMAGECOUNT value on done: 5726.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:05,248][63769] Sum rewards: -5.028, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.828', 'AMMO2': '0.004', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'AMMO4': '0.021', 'ARMOR': '0.033', 'AMMO3': '0.103', 'WEAPON5': '0.150', 'HITCOUNT': '0.270', 'weapon5': '0.292', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.843', 'weapon2': '1.432', 'weapon3': '1.672'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:05,612][63734] DAMAGECOUNT value on done: 5339.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:05,613][63734] Sum rewards: -1.505, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.419', 'AMMO5': '0.005', 'AMMO2': '0.008', 'WEAPON1': '0.010', 'AMMO4': '0.039', 'AMMO3': '0.100', 'ARMOR': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.100', 'HITCOUNT': '0.140', 'weapon5': '0.140', 'WEAPON5': '0.150', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.660', 'FRAGCOUNT': '1.000', 'weapon3': '1.498', 'weapon2': '1.814'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:05,889][63806] DAMAGECOUNT value on done: 4997.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:05,889][63806] Sum rewards: -4.900, reward structure: {'DEATHCOUNT': '-11.250', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO2': '0.023', 'weapon5': '0.042', 'ARMOR': '0.056', 'AMMO3': '0.092', 'AMMO4': '0.112', 'HEALTH': '0.148', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'HITCOUNT': '0.170', 'weapon4': '0.344', 'DAMAGECOUNT': '0.507', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.298', 'weapon2': '1.630'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:06,214][63806] DAMAGECOUNT value on done: 8174.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:06,215][63806] Sum rewards: -4.299, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.410', 'ARMOR': '0.008', 'AMMO5': '0.012', 'AMMO2': '0.015', 'weapon5': '0.064', 'AMMO4': '0.075', 'AMMO3': '0.085', 'WEAPON5': '0.100', 'weapon4': '0.146', 'HITCOUNT': '0.250', 'WEAPON4': '0.250', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.915', 'weapon3': '1.262', 'weapon2': '1.828', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:06,477][63733] Updated weights for policy 1, policy_version 1320 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:07,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11127.5, 300 sec: 11066.1). Total num frames: 11046912. Throughput: 0: 1608.1, 1: 1179.9. Samples: 2756716. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:07,460][109198] Avg episode reward: [(0, '-2.590'), (1, '-3.612')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:07,466][63576] Saving new best policy, reward=-3.612!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:08,786][63767] DAMAGECOUNT value on done: 8680.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:08,787][63767] Sum rewards: 4.721, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.013', 'AMMO5': '0.010', 'AMMO2': '0.032', 'AMMO3': '0.056', 'WEAPON5': '0.150', 'AMMO4': '0.161', 'WEAPON4': '0.250', 'HITCOUNT': '0.290', 'WEAPON3': '0.300', 'weapon5': '0.332', 'ARMOR': '0.432', 'weapon4': '0.668', 'weapon3': '0.684', 'DAMAGECOUNT': '1.263', 'weapon2': '1.356', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:09,127][63767] DAMAGECOUNT value on done: 8554.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:09,127][63767] Sum rewards: -3.832, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.244', 'AMMO5': '0.007', 'ARMOR': '0.020', 'WEAPON1': '0.020', 'AMMO2': '0.028', 'weapon5': '0.044', 'AMMO3': '0.130', 'AMMO4': '0.142', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'weapon4': '0.262', 'HITCOUNT': '0.300', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.020', 'weapon2': '1.512', 'weapon3': '1.526'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:09,940][63732] Updated weights for policy 0, policy_version 1380 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:10,614][63770] DAMAGECOUNT value on done: 5841.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:10,615][63770] Sum rewards: -4.404, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.252', 'AMMO5': '0.005', 'AMMO2': '0.014', 'WEAPON1': '0.030', 'ARMOR': '0.040', 'weapon5': '0.046', 'weapon4': '0.062', 'AMMO4': '0.071', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.133', 'weapon7': '0.184', 'HITCOUNT': '0.210', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.801', 'WEAPON3': '0.850', 'weapon2': '1.334', 'weapon3': '1.818'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:11,018][63770] DAMAGECOUNT value on done: 6776.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:11,018][63770] Sum rewards: -3.679, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.732', 'AMMO5': '0.003', 'WEAPON1': '0.020', 'AMMO2': '0.022', 'WEAPON5': '0.050', 'ARMOR': '0.072', 'weapon7': '0.092', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO4': '0.110', 'AMMO3': '0.167', 'weapon5': '0.194', 'HITCOUNT': '0.240', 'WEAPON4': '0.250', 'weapon4': '0.408', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.119', 'weapon2': '1.304', 'weapon3': '1.452'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:11,739][63805] DAMAGECOUNT value on done: 8512.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:11,740][63805] Sum rewards: -0.836, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.963', 'AMMO2': '0.008', 'ARMOR': '0.008', 'AMMO5': '0.020', 'WEAPON1': '0.020', 'AMMO4': '0.039', 'WEAPON4': '0.050', 'weapon4': '0.080', 'AMMO3': '0.122', 'weapon5': '0.146', 'WEAPON5': '0.400', 'HITCOUNT': '0.440', 'WEAPON3': '0.750', 'weapon2': '1.338', 'DAMAGECOUNT': '1.848', 'weapon3': '1.858', 'FRAGCOUNT': '3.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:12,080][63805] DAMAGECOUNT value on done: 7725.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:12,080][63805] Sum rewards: 2.175, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.870', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.021', 'ARMOR': '0.044', 'weapon5': '0.092', 'AMMO3': '0.099', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.104', 'weapon7': '0.110', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'weapon4': '0.226', 'WEAPON3': '0.600', 'weapon2': '1.434', 'weapon3': '1.480', 'DAMAGECOUNT': '1.500', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:12,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11127.5, 300 sec: 11066.1). Total num frames: 11104256. Throughput: 0: 1563.0, 1: 1232.8. Samples: 2773570. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:12,460][109198] Avg episode reward: [(0, '-2.405'), (1, '-3.615')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:13,225][63733] Updated weights for policy 1, policy_version 1330 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:15,099][63771] DAMAGECOUNT value on done: 7804.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:15,100][63771] Sum rewards: -3.412, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.150', 'AMMO2': '0.006', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO4': '0.029', 'ARMOR': '0.084', 'AMMO3': '0.118', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'weapon5': '0.182', 'WEAPON4': '0.200', 'weapon4': '0.284', 'DAMAGECOUNT': '0.735', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.320', 'weapon3': '1.632'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:15,508][63771] DAMAGECOUNT value on done: 5169.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:16,671][63734] DAMAGECOUNT value on done: 7359.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:16,671][63734] Sum rewards: -1.837, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.856', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO2': '0.018', 'ARMOR': '0.036', 'AMMO3': '0.066', 'AMMO4': '0.089', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'weapon5': '0.152', 'weapon4': '0.192', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.510', 'weapon3': '0.934', 'FRAGCOUNT': '1.000', 'weapon2': '1.900'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:17,061][63734] DAMAGECOUNT value on done: 6369.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:17,062][63734] Sum rewards: -2.528, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.429', 'AMMO2': '0.010', 'AMMO5': '0.027', 'AMMO4': '0.052', 'WEAPON4': '0.100', 'AMMO3': '0.117', 'HITCOUNT': '0.140', 'weapon5': '0.174', 'weapon4': '0.270', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.510', 'ARMOR': '0.559', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.332', 'weapon3': '1.610'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:17,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11195.7, 300 sec: 11080.0). Total num frames: 11161600. Throughput: 0: 1538.1, 1: 1262.2. Samples: 2782137. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:17,460][109198] Avg episode reward: [(0, '-2.362'), (1, '-3.477')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:17,467][63576] Saving new best policy, reward=-3.477!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:17,573][63732] Updated weights for policy 0, policy_version 1390 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:17,751][63806] DAMAGECOUNT value on done: 7150.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:17,751][63806] Sum rewards: -3.673, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.118', 'AMMO2': '0.013', 'AMMO5': '0.017', 'ARMOR': '0.032', 'weapon5': '0.050', 'AMMO4': '0.066', 'WEAPON4': '0.100', 'AMMO3': '0.170', 'WEAPON5': '0.250', 'HITCOUNT': '0.260', 'weapon4': '0.342', 'weapon2': '1.088', 'WEAPON3': '1.100', 'DAMAGECOUNT': '1.425', 'FRAGCOUNT': '2.000', 'weapon3': '2.032'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:18,081][63806] DAMAGECOUNT value on done: 6596.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:18,082][63806] Sum rewards: -2.430, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.729', 'AMMO5': '0.005', 'AMMO2': '0.018', 'WEAPON5': '0.050', 'weapon5': '0.060', 'AMMO4': '0.087', 'AMMO3': '0.151', 'HITCOUNT': '0.200', 'WEAPON4': '0.400', 'FRAGCOUNT': '0.500', 'weapon2': '0.530', 'weapon4': '0.670', 'WEAPON3': '0.850', 'ARMOR': '0.971', 'DAMAGECOUNT': '1.017', 'weapon3': '2.040'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:19,956][63735] DAMAGECOUNT value on done: 7175.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:19,957][63735] Sum rewards: -4.859, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.480', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'AMMO5': '0.008', 'weapon7': '0.068', 'WEAPON4': '0.100', 'weapon5': '0.108', 'weapon4': '0.112', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.136', 'HITCOUNT': '0.150', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.525', 'WEAPON3': '0.750', 'weapon2': '1.118', 'weapon3': '1.666'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:20,270][63733] Updated weights for policy 1, policy_version 1340 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:20,299][63735] DAMAGECOUNT value on done: 7160.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:20,299][63735] Sum rewards: -2.036, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.965', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'weapon4': '0.012', 'AMMO2': '0.012', 'weapon5': '0.024', 'ARMOR': '0.036', 'WEAPON4': '0.050', 'AMMO4': '0.061', 'AMMO3': '0.118', 'WEAPON5': '0.150', 'HITCOUNT': '0.250', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.762', 'weapon2': '1.648', 'weapon3': '1.888', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:20,615][63769] DAMAGECOUNT value on done: 6735.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:20,616][63769] Sum rewards: -5.358, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-0.808', 'AMMO4': '-0.014', 'AMMO2': '-0.003', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'weapon7': '0.070', 'weapon5': '0.104', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.135', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.330', 'WEAPON3': '0.700', 'weapon2': '1.466', 'FRAGCOUNT': '1.500', 'weapon3': '1.592', 'DAMAGECOUNT': '1.650'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:21,008][63769] DAMAGECOUNT value on done: 7028.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:21,008][63769] Sum rewards: -0.119, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO2': '0.031', 'WEAPON4': '0.100', 'AMMO3': '0.125', 'AMMO4': '0.154', 'HEALTH': '0.224', 'HITCOUNT': '0.240', 'weapon4': '0.404', 'ARMOR': '0.460', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.663', 'weapon2': '1.538', 'weapon3': '1.542', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:22,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11127.4, 300 sec: 11066.1). Total num frames: 11214848. Throughput: 0: 1493.6, 1: 1314.4. Samples: 2799127. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:22,461][109198] Avg episode reward: [(0, '-2.447'), (1, '-3.494')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:24,284][63767] DAMAGECOUNT value on done: 7642.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:24,284][63767] Sum rewards: 0.887, reward structure: {'DEATHCOUNT': '-9.000', 'WEAPON1': '0.010', 'AMMO5': '0.017', 'AMMO2': '0.024', 'weapon5': '0.098', 'AMMO3': '0.104', 'AMMO4': '0.120', 'weapon4': '0.150', 'HEALTH': '0.156', 'WEAPON4': '0.250', 'HITCOUNT': '0.300', 'WEAPON5': '0.300', 'ARMOR': '0.412', 'WEAPON3': '0.550', 'DAMAGECOUNT': '1.215', 'weapon2': '1.516', 'weapon3': '1.664', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:24,426][63770] DAMAGECOUNT value on done: 8162.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:24,426][63770] Sum rewards: 1.760, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.264', 'AMMO4': '-0.006', 'AMMO2': '-0.001', 'AMMO5': '0.015', 'ARMOR': '0.060', 'weapon5': '0.080', 'AMMO3': '0.139', 'WEAPON5': '0.300', 'HITCOUNT': '0.320', 'WEAPON3': '0.800', 'weapon2': '1.472', 'DAMAGECOUNT': '1.635', 'weapon3': '1.960', 'FRAGCOUNT': '6.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:24,614][63732] Updated weights for policy 0, policy_version 1400 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:24,625][63767] DAMAGECOUNT value on done: 7135.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:24,904][63770] DAMAGECOUNT value on done: 5259.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:24,905][63770] Sum rewards: 1.179, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.718', 'AMMO2': '0.011', 'AMMO4': '0.053', 'ARMOR': '0.064', 'AMMO3': '0.125', 'WEAPON4': '0.200', 'weapon4': '0.220', 'HITCOUNT': '0.470', 'WEAPON3': '0.850', 'weapon2': '1.368', 'weapon3': '1.890', 'DAMAGECOUNT': '1.896', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:27,436][63805] DAMAGECOUNT value on done: 8927.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:27,454][63771] DAMAGECOUNT value on done: 4363.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:27,455][63771] Sum rewards: 0.428, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.462', 'AMMO2': '0.004', 'AMMO5': '0.008', 'AMMO4': '0.022', 'WEAPON4': '0.050', 'AMMO3': '0.075', 'weapon5': '0.076', 'weapon4': '0.186', 'HITCOUNT': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.450', 'ARMOR': '0.507', 'DAMAGECOUNT': '0.645', 'weapon3': '1.586', 'weapon2': '1.630', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:27,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11264.0, 300 sec: 11080.0). Total num frames: 11276288. Throughput: 0: 1463.9, 1: 1356.3. Samples: 2816299. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:27,460][109198] Avg episode reward: [(0, '-2.340'), (1, '-3.447')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:27,467][63576] Saving new best policy, reward=-3.447!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:27,783][63733] Updated weights for policy 1, policy_version 1350 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:27,809][63771] DAMAGECOUNT value on done: 6916.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:27,810][63771] Sum rewards: -0.823, reward structure: {'DEATHCOUNT': '-9.000', 'AMMO2': '0.014', 'AMMO5': '0.017', 'WEAPON4': '0.050', 'ARMOR': '0.064', 'AMMO4': '0.069', 'AMMO3': '0.118', 'weapon5': '0.122', 'weapon4': '0.158', 'HITCOUNT': '0.240', 'HEALTH': '0.246', 'WEAPON5': '0.250', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.110', 'weapon2': '1.528', 'weapon3': '1.590', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:27,813][63805] DAMAGECOUNT value on done: 5495.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:27,813][63805] Sum rewards: -0.665, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.120', 'AMMO2': '0.002', 'AMMO5': '0.010', 'AMMO4': '0.010', 'WEAPON1': '0.030', 'weapon4': '0.074', 'WEAPON4': '0.100', 'AMMO3': '0.121', 'weapon5': '0.146', 'WEAPON5': '0.150', 'HITCOUNT': '0.240', 'ARMOR': '0.445', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.050', 'weapon3': '1.676', 'weapon2': '1.700', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:28,083][63735] DAMAGECOUNT value on done: 7377.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:28,283][63769] DAMAGECOUNT value on done: 7780.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:28,283][63769] Sum rewards: -2.167, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.114', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.020', 'AMMO4': '0.099', 'WEAPON4': '0.100', 'AMMO3': '0.108', 'WEAPON5': '0.150', 'HITCOUNT': '0.160', 'weapon4': '0.162', 'weapon5': '0.234', 'ARMOR': '0.436', 'DAMAGECOUNT': '0.462', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.014', 'weapon2': '1.734'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:28,421][63735] DAMAGECOUNT value on done: 4613.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:28,422][63735] Sum rewards: -1.641, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.740', 'AMMO5': '0.007', 'AMMO2': '0.020', 'WEAPON1': '0.030', 'ARMOR': '0.032', 'AMMO4': '0.098', 'AMMO3': '0.111', 'weapon5': '0.148', 'WEAPON5': '0.150', 'HITCOUNT': '0.200', 'weapon4': '0.238', 'WEAPON4': '0.250', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.705', 'FRAGCOUNT': '1.000', 'weapon2': '1.466', 'weapon3': '1.594'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:28,674][63769] DAMAGECOUNT value on done: 5760.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:28,810][63806] DAMAGECOUNT value on done: 5027.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:28,811][63806] Sum rewards: -3.113, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.011', 'AMMO5': '0.017', 'WEAPON1': '0.040', 'HITCOUNT': '0.040', 'AMMO4': '0.055', 'AMMO3': '0.067', 'DAMAGECOUNT': '0.090', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon7': '0.118', 'WEAPON5': '0.300', 'HEALTH': '0.332', 'weapon5': '0.342', 'WEAPON3': '0.400', 'weapon3': '0.912', 'weapon2': '1.112'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:29,150][63806] DAMAGECOUNT value on done: 8363.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:29,150][63806] Sum rewards: 0.655, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.940', 'AMMO4': '-0.015', 'AMMO2': '-0.003', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'ARMOR': '0.040', 'AMMO3': '0.068', 'WEAPON4': '0.100', 'HITCOUNT': '0.170', 'weapon4': '0.216', 'WEAPON5': '0.300', 'weapon5': '0.358', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.567', 'FRAGCOUNT': '1.000', 'weapon2': '1.314', 'weapon3': '1.404'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:30,361][63734] DAMAGECOUNT value on done: 6742.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:30,361][63734] Sum rewards: -2.257, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.040', 'AMMO5': '0.005', 'AMMO2': '0.019', 'ARMOR': '0.052', 'AMMO3': '0.080', 'weapon5': '0.084', 'AMMO4': '0.093', 'WEAPON5': '0.100', 'HITCOUNT': '0.210', 'weapon4': '0.238', 'WEAPON4': '0.300', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.498', 'FRAGCOUNT': '1.000', 'weapon3': '1.342', 'weapon2': '1.862'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:30,760][63734] DAMAGECOUNT value on done: 5459.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:31,350][63732] Updated weights for policy 0, policy_version 1410 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:31,740][63767] DAMAGECOUNT value on done: 8825.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:32,142][63767] DAMAGECOUNT value on done: 8929.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:32,142][63767] Sum rewards: -4.175, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.892', 'ARMOR': '0.005', 'AMMO2': '0.010', 'AMMO5': '0.015', 'AMMO4': '0.051', 'weapon5': '0.132', 'AMMO3': '0.166', 'HITCOUNT': '0.180', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.404', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.125', 'weapon3': '1.422', 'weapon2': '1.456', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:32,458][109198] Fps is (10 sec: 11878.7, 60 sec: 11264.0, 300 sec: 11093.9). Total num frames: 11333632. Throughput: 0: 1454.0, 1: 1366.0. Samples: 2824775. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:32,460][109198] Avg episode reward: [(0, '-2.307'), (1, '-3.310')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:32,461][63576] Saving new best policy, reward=-3.310!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:34,942][63805] DAMAGECOUNT value on done: 8547.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:34,942][63805] Sum rewards: -4.295, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.480', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'ARMOR': '0.012', 'AMMO2': '0.018', 'HITCOUNT': '0.040', 'weapon5': '0.056', 'AMMO4': '0.087', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.105', 'AMMO3': '0.118', 'WEAPON5': '0.150', 'weapon4': '0.184', 'WEAPON3': '0.600', 'weapon3': '1.222', 'weapon2': '1.726'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:35,269][63805] DAMAGECOUNT value on done: 7820.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:35,269][63805] Sum rewards: -1.522, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.790', 'weapon5': '0.014', 'AMMO5': '0.015', 'AMMO2': '0.023', 'ARMOR': '0.080', 'HITCOUNT': '0.110', 'AMMO4': '0.114', 'AMMO3': '0.131', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.285', 'WEAPON4': '0.300', 'weapon4': '0.590', 'WEAPON3': '0.700', 'weapon2': '0.972', 'FRAGCOUNT': '1.000', 'weapon3': '1.534'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:35,406][63733] Updated weights for policy 1, policy_version 1360 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:35,913][63770] DAMAGECOUNT value on done: 6330.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:35,913][63770] Sum rewards: -4.393, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.160', 'AMMO2': '0.002', 'AMMO5': '0.008', 'AMMO4': '0.010', 'ARMOR': '0.012', 'WEAPON1': '0.050', 'WEAPON4': '0.050', 'weapon5': '0.140', 'weapon4': '0.142', 'WEAPON5': '0.150', 'AMMO3': '0.184', 'HITCOUNT': '0.400', 'WEAPON3': '1.000', 'DAMAGECOUNT': '1.467', 'weapon2': '1.480', 'FRAGCOUNT': '1.500', 'weapon3': '1.672'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:36,322][63770] DAMAGECOUNT value on done: 6781.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:37,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11332.3, 300 sec: 11107.8). Total num frames: 11390976. Throughput: 0: 1450.3, 1: 1386.2. Samples: 2842221. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:37,459][109198] Avg episode reward: [(0, '-2.292'), (1, '-3.351')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:38,050][63732] Updated weights for policy 0, policy_version 1420 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:38,168][63771] DAMAGECOUNT value on done: 7983.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:38,565][63771] DAMAGECOUNT value on done: 5326.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:38,566][63771] Sum rewards: -4.817, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.180', 'AMMO2': '0.006', 'AMMO5': '0.008', 'WEAPON1': '0.020', 'AMMO4': '0.028', 'ARMOR': '0.036', 'AMMO3': '0.080', 'weapon5': '0.122', 'WEAPON4': '0.150', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'weapon4': '0.292', 'DAMAGECOUNT': '0.471', 'WEAPON3': '0.500', 'weapon3': '1.404', 'weapon2': '1.636'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:40,166][63734] DAMAGECOUNT value on done: 7641.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:40,167][63734] Sum rewards: -3.837, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.970', 'AMMO2': '0.007', 'ARMOR': '0.008', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.035', 'weapon5': '0.044', 'AMMO3': '0.114', 'WEAPON5': '0.150', 'weapon4': '0.214', 'WEAPON4': '0.250', 'HITCOUNT': '0.280', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.846', 'weapon2': '1.548', 'weapon3': '1.604', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:40,514][63734] DAMAGECOUNT value on done: 6625.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:40,515][63734] Sum rewards: -3.042, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.496', 'AMMO2': '0.002', 'AMMO5': '0.003', 'AMMO4': '0.007', 'weapon5': '0.040', 'WEAPON5': '0.050', 'AMMO3': '0.114', 'HITCOUNT': '0.220', 'ARMOR': '0.416', 'DAMAGECOUNT': '0.768', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.286', 'weapon3': '1.998'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:40,542][63806] DAMAGECOUNT value on done: 7442.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:40,542][63806] Sum rewards: 0.809, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.415', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'AMMO5': '0.010', 'AMMO3': '0.067', 'WEAPON4': '0.100', 'weapon5': '0.176', 'HITCOUNT': '0.190', 'WEAPON5': '0.250', 'weapon4': '0.254', 'ARMOR': '0.436', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.876', 'weapon3': '1.242', 'weapon2': '1.380', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:40,913][63806] DAMAGECOUNT value on done: 6725.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:40,914][63806] Sum rewards: -6.061, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.494', 'AMMO5': '0.012', 'AMMO2': '0.016', 'AMMO4': '0.080', 'ARMOR': '0.100', 'HITCOUNT': '0.140', 'AMMO3': '0.145', 'WEAPON4': '0.150', 'weapon5': '0.180', 'WEAPON5': '0.250', 'weapon4': '0.294', 'DAMAGECOUNT': '0.387', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.800', 'weapon2': '1.160', 'weapon3': '1.468'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:42,458][109198] Fps is (10 sec: 11468.6, 60 sec: 11400.6, 300 sec: 11107.8). Total num frames: 11448320. Throughput: 0: 1453.6, 1: 1393.1. Samples: 2859489. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:42,460][109198] Avg episode reward: [(0, '-2.251'), (1, '-3.352')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:42,784][63735] DAMAGECOUNT value on done: 7256.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:42,785][63735] Sum rewards: -4.269, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.296', 'AMMO5': '0.012', 'AMMO2': '0.024', 'weapon5': '0.036', 'HITCOUNT': '0.100', 'AMMO4': '0.118', 'AMMO3': '0.142', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.243', 'WEAPON5': '0.250', 'weapon4': '0.292', 'ARMOR': '0.464', 'WEAPON3': '0.650', 'weapon3': '0.714', 'FRAGCOUNT': '1.000', 'weapon2': '1.832'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:42,936][63733] Updated weights for policy 1, policy_version 1370 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:43,100][63735] DAMAGECOUNT value on done: 7205.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:44,055][63769] DAMAGECOUNT value on done: 7170.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:44,056][63769] Sum rewards: 1.978, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.490', 'AMMO2': '0.012', 'AMMO5': '0.013', 'AMMO4': '0.062', 'ARMOR': '0.080', 'AMMO3': '0.101', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'weapon4': '0.228', 'HITCOUNT': '0.360', 'WEAPON3': '0.700', 'weapon2': '1.254', 'DAMAGECOUNT': '1.305', 'weapon3': '1.552', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:44,411][63769] DAMAGECOUNT value on done: 7154.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:44,411][63769] Sum rewards: -8.196, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.550', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.007', 'AMMO2': '0.030', 'ARMOR': '0.051', 'HITCOUNT': '0.100', 'weapon5': '0.116', 'AMMO3': '0.127', 'WEAPON5': '0.150', 'AMMO4': '0.152', 'weapon4': '0.294', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.378', 'WEAPON3': '0.800', 'weapon2': '1.154', 'weapon3': '1.694'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:44,696][63732] Updated weights for policy 0, policy_version 1430 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:47,062][63767] DAMAGECOUNT value on done: 7844.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:47,446][63767] DAMAGECOUNT value on done: 7205.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:47,458][109198] Fps is (10 sec: 11878.3, 60 sec: 11468.8, 300 sec: 11121.7). Total num frames: 11509760. Throughput: 0: 1456.3, 1: 1395.4. Samples: 2868268. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:47,460][109198] Avg episode reward: [(0, '-2.231'), (1, '-3.365')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:49,761][63770] DAMAGECOUNT value on done: 8367.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:49,762][63770] Sum rewards: -5.902, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.002', 'AMMO2': '0.002', 'AMMO5': '0.003', 'AMMO4': '0.009', 'WEAPON5': '0.050', 'weapon5': '0.064', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'AMMO3': '0.189', 'weapon4': '0.198', 'DAMAGECOUNT': '0.615', 'WEAPON3': '0.900', 'weapon3': '1.244', 'weapon2': '1.776', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:49,980][63805] DAMAGECOUNT value on done: 9157.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:49,981][63805] Sum rewards: 4.400, reward structure: {'DEATHCOUNT': '-2.250', 'AMMO4': '-0.014', 'AMMO2': '-0.003', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO3': '0.040', 'WEAPON5': '0.050', 'HEALTH': '0.120', 'WEAPON3': '0.200', 'HITCOUNT': '0.200', 'ARMOR': '0.458', 'DAMAGECOUNT': '0.690', 'weapon2': '0.850', 'weapon3': '1.046', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:50,161][63770] DAMAGECOUNT value on done: 5688.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:50,161][63770] Sum rewards: 1.116, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.743', 'AMMO5': '0.005', 'AMMO2': '0.011', 'weapon5': '0.042', 'WEAPON1': '0.050', 'AMMO4': '0.055', 'WEAPON5': '0.100', 'AMMO3': '0.101', 'WEAPON4': '0.150', 'weapon4': '0.216', 'HITCOUNT': '0.380', 'WEAPON3': '0.600', 'weapon2': '1.224', 'DAMAGECOUNT': '1.287', 'weapon3': '1.888', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:50,290][63733] Updated weights for policy 1, policy_version 1380 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:50,322][63735] DAMAGECOUNT value on done: 7532.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:50,374][63805] DAMAGECOUNT value on done: 5885.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:50,374][63805] Sum rewards: -2.421, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.042', 'AMMO2': '0.002', 'AMMO4': '0.009', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'weapon5': '0.028', 'WEAPON4': '0.100', 'AMMO3': '0.117', 'weapon4': '0.236', 'WEAPON5': '0.250', 'HITCOUNT': '0.310', 'ARMOR': '0.432', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.170', 'weapon2': '1.460', 'weapon3': '1.720', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:50,512][63771] DAMAGECOUNT value on done: 4728.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:50,513][63771] Sum rewards: 0.831, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.907', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.023', 'ARMOR': '0.040', 'AMMO3': '0.076', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.116', 'weapon5': '0.138', 'weapon4': '0.158', 'HITCOUNT': '0.260', 'WEAPON3': '0.450', 'DAMAGECOUNT': '1.095', 'weapon3': '1.390', 'FRAGCOUNT': '1.500', 'weapon2': '1.528'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:50,628][63735] DAMAGECOUNT value on done: 4813.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:50,628][63735] Sum rewards: -0.656, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.395', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO2': '0.024', 'weapon5': '0.078', 'AMMO3': '0.098', 'AMMO4': '0.118', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'weapon4': '0.214', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.600', 'weapon2': '1.210', 'weapon3': '1.870', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:50,921][63771] DAMAGECOUNT value on done: 7206.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:50,922][63771] Sum rewards: -1.328, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.058', 'weapon5': '0.008', 'AMMO2': '0.011', 'AMMO5': '0.015', 'ARMOR': '0.036', 'AMMO4': '0.056', 'AMMO3': '0.078', 'weapon7': '0.102', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.240', 'WEAPON4': '0.250', 'weapon4': '0.306', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.870', 'FRAGCOUNT': '1.000', 'weapon3': '1.036', 'weapon2': '1.382'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:51,252][63769] DAMAGECOUNT value on done: 7991.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:51,253][63769] Sum rewards: -2.830, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.742', 'AMMO2': '0.002', 'ARMOR': '0.004', 'AMMO4': '0.009', 'AMMO3': '0.102', 'HITCOUNT': '0.130', 'WEAPON4': '0.150', 'weapon4': '0.196', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.633', 'weapon3': '1.432', 'weapon2': '1.954', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:51,439][63732] Updated weights for policy 0, policy_version 1440 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:51,459][63806] DAMAGECOUNT value on done: 5402.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:51,459][63806] Sum rewards: 0.199, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.324', 'AMMO2': '0.004', 'weapon5': '0.012', 'AMMO5': '0.015', 'AMMO4': '0.020', 'WEAPON1': '0.040', 'WEAPON4': '0.100', 'AMMO3': '0.139', 'weapon4': '0.148', 'WEAPON5': '0.300', 'HITCOUNT': '0.330', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.125', 'weapon2': '1.334', 'weapon3': '1.806', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:51,588][63769] DAMAGECOUNT value on done: 5956.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:51,589][63769] Sum rewards: 1.154, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.772', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO2': '0.031', 'AMMO3': '0.092', 'HITCOUNT': '0.150', 'AMMO4': '0.154', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'weapon4': '0.296', 'weapon5': '0.372', 'DAMAGECOUNT': '0.588', 'WEAPON3': '0.650', 'ARMOR': '0.988', 'weapon2': '1.072', 'weapon3': '1.798', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:51,777][63806] DAMAGECOUNT value on done: 8463.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:52,458][109198] Fps is (10 sec: 11469.0, 60 sec: 11400.5, 300 sec: 11121.7). Total num frames: 11563008. Throughput: 0: 1468.8, 1: 1394.8. Samples: 2885580. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:52,460][109198] Avg episode reward: [(0, '-2.283'), (1, '-3.056')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:52,461][63576] Saving new best policy, reward=-3.056!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:54,811][63767] DAMAGECOUNT value on done: 9060.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:54,812][63767] Sum rewards: -2.013, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.216', 'AMMO5': '0.007', 'AMMO2': '0.015', 'WEAPON1': '0.020', 'weapon5': '0.048', 'AMMO4': '0.075', 'ARMOR': '0.104', 'AMMO3': '0.108', 'WEAPON5': '0.150', 'HITCOUNT': '0.220', 'WEAPON4': '0.300', 'weapon4': '0.560', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.705', 'FRAGCOUNT': '1.000', 'weapon2': '1.138', 'weapon3': '1.402'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:55,189][63767] DAMAGECOUNT value on done: 9138.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:55,189][63767] Sum rewards: -7.100, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.426', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'weapon5': '0.006', 'AMMO2': '0.031', 'ARMOR': '0.040', 'WEAPON5': '0.100', 'AMMO3': '0.118', 'AMMO4': '0.153', 'HITCOUNT': '0.200', 'WEAPON4': '0.400', 'weapon4': '0.528', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.627', 'weapon3': '1.116', 'weapon2': '1.402'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:55,503][63734] DAMAGECOUNT value on done: 7171.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:55,503][63734] Sum rewards: 2.022, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.632', 'AMMO4': '-0.003', 'AMMO2': '-0.000', 'AMMO5': '0.003', 'AMMO3': '0.099', 'WEAPON5': '0.100', 'weapon5': '0.142', 'WEAPON4': '0.150', 'HITCOUNT': '0.210', 'weapon4': '0.398', 'ARMOR': '0.452', 'WEAPON3': '0.500', 'weapon3': '1.206', 'DAMAGECOUNT': '1.287', 'weapon2': '1.610', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:55,910][63734] DAMAGECOUNT value on done: 5680.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:55,911][63734] Sum rewards: -3.830, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.392', 'AMMO5': '0.007', 'AMMO2': '0.013', 'weapon5': '0.048', 'WEAPON1': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.062', 'weapon4': '0.102', 'AMMO3': '0.124', 'WEAPON5': '0.150', 'HITCOUNT': '0.180', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.663', 'ARMOR': '0.884', 'FRAGCOUNT': '1.000', 'weapon3': '1.424', 'weapon2': '1.654'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:57,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11400.5, 300 sec: 11121.7). Total num frames: 11620352. Throughput: 0: 1494.2, 1: 1378.1. Samples: 2902820. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:53:57,460][109198] Avg episode reward: [(0, '-2.304'), (1, '-3.070')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:57,864][63805] DAMAGECOUNT value on done: 8597.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:58,037][63733] Updated weights for policy 1, policy_version 1390 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:58,160][63732] Updated weights for policy 0, policy_version 1450 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:58,244][63805] DAMAGECOUNT value on done: 8286.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:53:58,245][63805] Sum rewards: -0.269, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.424', 'AMMO5': '0.005', 'AMMO2': '0.017', 'WEAPON5': '0.050', 'ARMOR': '0.068', 'AMMO4': '0.085', 'AMMO3': '0.099', 'weapon5': '0.118', 'WEAPON4': '0.200', 'HITCOUNT': '0.250', 'weapon4': '0.264', 'WEAPON3': '0.650', 'weapon2': '1.018', 'DAMAGECOUNT': '1.398', 'weapon3': '1.682', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:01,210][63771] DAMAGECOUNT value on done: 8278.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:01,210][63771] Sum rewards: -2.753, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.166', 'AMMO5': '0.007', 'WEAPON1': '0.030', 'ARMOR': '0.032', 'AMMO2': '0.034', 'weapon4': '0.084', 'AMMO3': '0.137', 'WEAPON5': '0.150', 'AMMO4': '0.169', 'HITCOUNT': '0.200', 'weapon5': '0.206', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.885', 'weapon2': '0.898', 'WEAPON3': '0.900', 'FRAGCOUNT': '2.000', 'weapon3': '2.180'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:01,325][63770] DAMAGECOUNT value on done: 6390.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:01,326][63770] Sum rewards: -3.123, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.542', 'AMMO2': '0.010', 'AMMO5': '0.010', 'weapon5': '0.022', 'AMMO4': '0.049', 'HITCOUNT': '0.050', 'ARMOR': '0.068', 'AMMO3': '0.114', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.180', 'WEAPON4': '0.250', 'weapon4': '0.394', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.278', 'weapon3': '1.594'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:01,550][63771] DAMAGECOUNT value on done: 5536.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:01,550][63771] Sum rewards: -3.346, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.256', 'AMMO5': '0.007', 'weapon5': '0.018', 'AMMO2': '0.035', 'WEAPON1': '0.060', 'AMMO3': '0.126', 'WEAPON5': '0.150', 'HITCOUNT': '0.160', 'AMMO4': '0.177', 'weapon4': '0.276', 'WEAPON4': '0.400', 'ARMOR': '0.419', 'DAMAGECOUNT': '0.630', 'WEAPON3': '0.750', 'weapon2': '1.498', 'weapon3': '1.702', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:01,770][63770] DAMAGECOUNT value on done: 7061.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:01,771][63770] Sum rewards: 0.121, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-1.390', 'AMMO2': '0.003', 'AMMO5': '0.010', 'AMMO4': '0.012', 'weapon5': '0.070', 'AMMO3': '0.078', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.206', 'HITCOUNT': '0.210', 'ARMOR': '0.500', 'WEAPON3': '0.550', 'weapon2': '0.724', 'DAMAGECOUNT': '0.840', 'FRAGCOUNT': '1.000', 'weapon3': '1.508'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:02,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11468.8, 300 sec: 11135.6). Total num frames: 11677696. Throughput: 0: 1505.8, 1: 1368.5. Samples: 2911480. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:02,460][109198] Avg episode reward: [(0, '-2.242'), (1, '-3.074')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:03,055][63806] DAMAGECOUNT value on done: 7712.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:03,055][63806] Sum rewards: -5.423, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.916', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.010', 'ARMOR': '0.017', 'AMMO2': '0.020', 'WEAPON1': '0.020', 'AMMO4': '0.099', 'WEAPON5': '0.150', 'AMMO3': '0.153', 'HITCOUNT': '0.180', 'weapon5': '0.186', 'WEAPON4': '0.300', 'weapon4': '0.368', 'DAMAGECOUNT': '0.810', 'WEAPON3': '0.950', 'weapon2': '1.184', 'weapon3': '1.546'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:03,373][63806] DAMAGECOUNT value on done: 7130.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:03,373][63806] Sum rewards: -1.011, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.790', 'AMMO2': '0.012', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'ARMOR': '0.040', 'AMMO4': '0.059', 'AMMO3': '0.105', 'weapon5': '0.118', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'HITCOUNT': '0.260', 'weapon4': '0.274', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.650', 'weapon2': '1.154', 'DAMAGECOUNT': '1.215', 'weapon3': '1.710'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:03,746][63734] DAMAGECOUNT value on done: 8004.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:03,747][63734] Sum rewards: -5.254, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.700', 'AMMO5': '0.009', 'ARMOR': '0.012', 'AMMO2': '0.014', 'WEAPON1': '0.020', 'weapon7': '0.040', 'weapon5': '0.068', 'AMMO4': '0.068', 'AMMO6': '0.160', 'AMMO7': '0.160', 'AMMO3': '0.170', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.240', 'WEAPON4': '0.250', 'weapon4': '0.338', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.089', 'weapon3': '1.336', 'weapon2': '1.472'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:04,143][63734] DAMAGECOUNT value on done: 7247.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:04,144][63734] Sum rewards: 0.334, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.188', 'AMMO2': '0.010', 'AMMO5': '0.022', 'WEAPON4': '0.050', 'ARMOR': '0.052', 'AMMO4': '0.052', 'weapon4': '0.068', 'AMMO3': '0.126', 'WEAPON5': '0.200', 'HITCOUNT': '0.340', 'weapon5': '0.398', 'WEAPON3': '0.600', 'weapon3': '1.426', 'weapon2': '1.560', 'DAMAGECOUNT': '1.866', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:04,844][63732] Updated weights for policy 0, policy_version 1460 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:05,119][63735] DAMAGECOUNT value on done: 7579.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:05,119][63735] Sum rewards: 1.333, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.636', 'AMMO4': '-0.008', 'AMMO2': '-0.001', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'ARMOR': '0.048', 'weapon5': '0.050', 'AMMO3': '0.106', 'WEAPON4': '0.150', 'HITCOUNT': '0.290', 'weapon4': '0.316', 'WEAPON5': '0.350', 'WEAPON3': '0.750', 'weapon2': '0.808', 'DAMAGECOUNT': '0.969', 'weapon3': '2.104', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:05,452][63735] DAMAGECOUNT value on done: 7559.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:05,453][63735] Sum rewards: -0.978, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.210', 'AMMO2': '0.000', 'AMMO4': '0.000', 'AMMO5': '0.013', 'weapon7': '0.018', 'AMMO3': '0.091', 'weapon5': '0.170', 'WEAPON4': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.240', 'WEAPON5': '0.250', 'weapon4': '0.360', 'WEAPON3': '0.700', 'ARMOR': '0.997', 'DAMAGECOUNT': '1.062', 'weapon2': '1.274', 'weapon3': '1.506', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:05,458][63733] Updated weights for policy 1, policy_version 1400 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:07,281][63769] DAMAGECOUNT value on done: 7568.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:07,282][63769] Sum rewards: 4.148, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.115', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.021', 'weapon5': '0.056', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.103', 'AMMO3': '0.108', 'weapon7': '0.154', 'WEAPON4': '0.250', 'HITCOUNT': '0.290', 'ARMOR': '0.476', 'weapon4': '0.530', 'WEAPON3': '0.600', 'weapon2': '1.170', 'DAMAGECOUNT': '1.194', 'weapon3': '1.396', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:07,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11468.8, 300 sec: 11135.6). Total num frames: 11735040. Throughput: 0: 1523.4, 1: 1357.9. Samples: 2928782. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:07,460][109198] Avg episode reward: [(0, '-2.194'), (1, '-3.074')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:07,684][63769] DAMAGECOUNT value on done: 7229.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:07,684][63769] Sum rewards: -3.545, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.936', 'AMMO2': '0.016', 'AMMO5': '0.022', 'HITCOUNT': '0.070', 'AMMO4': '0.081', 'AMMO3': '0.120', 'weapon5': '0.150', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.225', 'WEAPON5': '0.300', 'ARMOR': '0.400', 'weapon4': '0.414', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.166', 'weapon2': '1.476'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:10,153][63767] DAMAGECOUNT value on done: 8436.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:10,153][63767] Sum rewards: -0.186, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.143', 'AMMO4': '-0.018', 'AMMO2': '-0.003', 'ARMOR': '0.072', 'AMMO3': '0.192', 'HITCOUNT': '0.490', 'WEAPON3': '1.000', 'weapon2': '1.590', 'weapon3': '1.608', 'DAMAGECOUNT': '1.776', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:10,503][63767] DAMAGECOUNT value on done: 7410.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:11,690][63732] Updated weights for policy 0, policy_version 1470 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:12,458][109198] Fps is (10 sec: 11878.4, 60 sec: 11537.1, 300 sec: 11149.5). Total num frames: 11796480. Throughput: 0: 1521.5, 1: 1355.2. Samples: 2945748. Policy #0 lag: (min: 0.0, avg: 0.4, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:12,460][109198] Avg episode reward: [(0, '-2.228'), (1, '-3.046')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:12,461][63576] Saving new best policy, reward=-3.046!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:12,740][63735] DAMAGECOUNT value on done: 7827.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:12,741][63735] Sum rewards: -1.743, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.264', 'AMMO5': '0.015', 'AMMO2': '0.016', 'weapon4': '0.058', 'AMMO4': '0.081', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.130', 'HITCOUNT': '0.210', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.885', 'weapon3': '1.692', 'weapon2': '1.934', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:12,892][63805] DAMAGECOUNT value on done: 9562.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:12,893][63805] Sum rewards: -0.313, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.112', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.015', 'ARMOR': '0.052', 'AMMO4': '0.075', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.110', 'weapon5': '0.132', 'weapon4': '0.210', 'HITCOUNT': '0.230', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.215', 'weapon2': '1.228', 'weapon3': '1.716', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:13,088][63735] DAMAGECOUNT value on done: 5113.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:13,088][63735] Sum rewards: -2.378, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.049', 'ARMOR': '0.008', 'AMMO5': '0.015', 'AMMO2': '0.016', 'WEAPON1': '0.040', 'AMMO4': '0.081', 'AMMO3': '0.144', 'weapon5': '0.150', 'WEAPON4': '0.200', 'weapon4': '0.202', 'HITCOUNT': '0.270', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.900', 'weapon2': '0.936', 'WEAPON3': '0.950', 'FRAGCOUNT': '2.000', 'weapon3': '2.208'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:13,182][63733] Updated weights for policy 1, policy_version 1410 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:13,296][63805] DAMAGECOUNT value on done: 6285.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:13,297][63805] Sum rewards: -4.553, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.512', 'weapon5': '0.004', 'AMMO5': '0.013', 'AMMO2': '0.021', 'WEAPON1': '0.080', 'AMMO4': '0.105', 'AMMO3': '0.114', 'WEAPON5': '0.250', 'HITCOUNT': '0.270', 'WEAPON4': '0.300', 'ARMOR': '0.436', 'WEAPON3': '0.700', 'weapon4': '0.722', 'DAMAGECOUNT': '1.200', 'weapon3': '1.222', 'weapon2': '1.272', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:13,772][63806] DAMAGECOUNT value on done: 5694.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:13,772][63806] Sum rewards: -2.164, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.613', 'WEAPON1': '0.010', 'AMMO2': '0.016', 'AMMO5': '0.018', 'ARMOR': '0.052', 'AMMO4': '0.081', 'AMMO3': '0.108', 'weapon5': '0.146', 'WEAPON4': '0.200', 'HITCOUNT': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.340', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.876', 'FRAGCOUNT': '1.000', 'weapon2': '1.040', 'weapon3': '1.712'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:13,969][63771] DAMAGECOUNT value on done: 5058.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:13,969][63771] Sum rewards: -3.800, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.798', 'AMMO2': '0.000', 'AMMO4': '0.001', 'weapon7': '0.002', 'AMMO5': '0.012', 'weapon5': '0.018', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.150', 'WEAPON5': '0.250', 'HITCOUNT': '0.260', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.990', 'weapon2': '1.526', 'weapon3': '1.888', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:14,174][63806] DAMAGECOUNT value on done: 8628.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:14,175][63806] Sum rewards: -6.068, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.910', 'AMMO2': '0.003', 'AMMO4': '0.013', 'AMMO5': '0.015', 'ARMOR': '0.032', 'AMMO3': '0.110', 'HITCOUNT': '0.110', 'weapon5': '0.200', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.388', 'weapon3': '1.926'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:14,338][63771] DAMAGECOUNT value on done: 7356.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:14,339][63771] Sum rewards: -4.200, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.630', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.010', 'AMMO2': '0.016', 'ARMOR': '0.032', 'AMMO4': '0.080', 'weapon5': '0.082', 'AMMO3': '0.146', 'HITCOUNT': '0.150', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon4': '0.412', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.750', 'weapon3': '1.338', 'weapon2': '1.464'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:14,374][63769] DAMAGECOUNT value on done: 8369.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:14,374][63769] Sum rewards: -0.367, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.000', 'WEAPON1': '0.010', 'AMMO2': '0.012', 'AMMO5': '0.012', 'AMMO4': '0.058', 'weapon7': '0.076', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.130', 'WEAPON4': '0.150', 'WEAPON7': '0.200', 'WEAPON5': '0.250', 'HITCOUNT': '0.330', 'weapon4': '0.362', 'ARMOR': '0.449', 'WEAPON3': '0.800', 'weapon2': '1.110', 'DAMAGECOUNT': '1.134', 'weapon3': '1.810', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:14,790][63769] DAMAGECOUNT value on done: 6191.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:14,790][63769] Sum rewards: -5.911, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.882', 'AMMO2': '0.004', 'AMMO5': '0.010', 'AMMO4': '0.017', 'WEAPON1': '0.020', 'weapon5': '0.028', 'AMMO3': '0.120', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'HITCOUNT': '0.210', 'weapon4': '0.264', 'ARMOR': '0.521', 'DAMAGECOUNT': '0.705', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.468', 'weapon3': '1.654'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:15,224][63770] DAMAGECOUNT value on done: 8755.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:15,225][63770] Sum rewards: 2.619, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.830', 'AMMO2': '0.011', 'AMMO4': '0.055', 'ARMOR': '0.090', 'AMMO3': '0.106', 'WEAPON4': '0.250', 'HITCOUNT': '0.280', 'weapon4': '0.530', 'WEAPON3': '0.650', 'weapon2': '0.662', 'DAMAGECOUNT': '1.164', 'weapon3': '1.900', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:15,651][63770] DAMAGECOUNT value on done: 6048.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:15,651][63770] Sum rewards: -0.538, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.906', 'AMMO2': '0.011', 'AMMO5': '0.018', 'WEAPON1': '0.040', 'weapon5': '0.046', 'AMMO4': '0.052', 'AMMO3': '0.091', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'HITCOUNT': '0.230', 'weapon4': '0.318', 'WEAPON3': '0.650', 'weapon2': '0.962', 'DAMAGECOUNT': '1.080', 'weapon3': '1.770', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:17,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11468.8, 300 sec: 11149.5). Total num frames: 11849728. Throughput: 0: 1519.4, 1: 1354.2. Samples: 2954089. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:17,460][109198] Avg episode reward: [(0, '-2.239'), (1, '-2.917')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:17,467][63576] Saving new best policy, reward=-2.917!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:18,393][63767] DAMAGECOUNT value on done: 9275.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:18,393][63767] Sum rewards: -2.343, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.718', 'AMMO5': '0.008', 'WEAPON1': '0.010', 'weapon5': '0.032', 'AMMO2': '0.035', 'ARMOR': '0.092', 'weapon4': '0.104', 'AMMO3': '0.112', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'AMMO4': '0.175', 'WEAPON4': '0.300', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.645', 'weapon2': '1.286', 'weapon3': '1.706'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:18,582][63732] Updated weights for policy 0, policy_version 1480 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:18,774][63767] DAMAGECOUNT value on done: 9306.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:18,775][63767] Sum rewards: -2.750, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.486', 'AMMO5': '0.008', 'AMMO2': '0.012', 'AMMO4': '0.060', 'ARMOR': '0.068', 'AMMO3': '0.103', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'weapon5': '0.194', 'weapon4': '0.380', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.504', 'FRAGCOUNT': '1.000', 'weapon3': '1.240', 'weapon2': '1.476'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:20,777][63733] Updated weights for policy 1, policy_version 1420 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:21,084][63734] DAMAGECOUNT value on done: 7440.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:21,084][63734] Sum rewards: -5.615, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.840', 'AMMO5': '0.010', 'AMMO2': '0.035', 'weapon5': '0.050', 'ARMOR': '0.072', 'AMMO3': '0.137', 'WEAPON5': '0.150', 'AMMO4': '0.174', 'HITCOUNT': '0.200', 'WEAPON4': '0.350', 'weapon4': '0.496', 'DAMAGECOUNT': '0.807', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.142', 'weapon3': '1.252'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:21,156][63805] DAMAGECOUNT value on done: 8760.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:21,156][63805] Sum rewards: -3.665, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.482', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.008', 'weapon5': '0.050', 'WEAPON4': '0.100', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'weapon4': '0.154', 'AMMO3': '0.164', 'DAMAGECOUNT': '0.489', 'weapon2': '0.996', 'WEAPON3': '1.000', 'weapon3': '2.052', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:21,547][63734] DAMAGECOUNT value on done: 5904.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:21,548][63734] Sum rewards: -4.988, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.704', 'ARMOR': '0.008', 'AMMO2': '0.028', 'AMMO3': '0.123', 'AMMO4': '0.139', 'HITCOUNT': '0.180', 'WEAPON4': '0.250', 'weapon4': '0.374', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.672', 'FRAGCOUNT': '1.000', 'weapon3': '1.360', 'weapon2': '1.432'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:21,560][63805] DAMAGECOUNT value on done: 8641.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:22,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11537.1, 300 sec: 11149.4). Total num frames: 11907072. Throughput: 0: 1516.7, 1: 1351.4. Samples: 2971289. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:22,460][109198] Avg episode reward: [(0, '-2.379'), (1, '-2.926')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:24,370][63771] DAMAGECOUNT value on done: 8783.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:24,371][63771] Sum rewards: -1.387, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.533', 'WEAPON1': '0.010', 'AMMO2': '0.014', 'AMMO5': '0.018', 'weapon5': '0.020', 'ARMOR': '0.036', 'AMMO4': '0.071', 'AMMO3': '0.138', 'WEAPON4': '0.150', 'weapon4': '0.270', 'WEAPON5': '0.350', 'HITCOUNT': '0.360', 'WEAPON3': '0.700', 'weapon2': '1.372', 'weapon3': '1.372', 'DAMAGECOUNT': '1.515', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:24,777][63771] DAMAGECOUNT value on done: 5977.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:24,777][63771] Sum rewards: -3.170, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.046', 'weapon5': '0.008', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.010', 'AMMO4': '0.051', 'ARMOR': '0.060', 'AMMO3': '0.169', 'WEAPON5': '0.200', 'HITCOUNT': '0.340', 'WEAPON3': '0.950', 'weapon2': '1.216', 'DAMAGECOUNT': '1.323', 'weapon3': '2.028', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:25,337][63732] Updated weights for policy 0, policy_version 1490 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:26,077][63806] DAMAGECOUNT value on done: 7966.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:26,078][63806] Sum rewards: -2.565, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.965', 'AMMO2': '0.037', 'AMMO3': '0.112', 'ARMOR': '0.112', 'AMMO4': '0.183', 'HITCOUNT': '0.200', 'weapon4': '0.334', 'WEAPON4': '0.350', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.762', 'FRAGCOUNT': '1.000', 'weapon2': '1.092', 'weapon3': '1.768'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:26,417][63806] DAMAGECOUNT value on done: 7300.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:26,418][63806] Sum rewards: -3.575, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.224', 'AMMO5': '0.003', 'weapon5': '0.016', 'AMMO2': '0.030', 'WEAPON5': '0.050', 'ARMOR': '0.060', 'AMMO3': '0.068', 'HITCOUNT': '0.120', 'AMMO4': '0.152', 'WEAPON3': '0.250', 'WEAPON4': '0.450', 'DAMAGECOUNT': '0.510', 'weapon4': '0.640', 'weapon3': '0.838', 'FRAGCOUNT': '1.000', 'weapon2': '1.712'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:26,752][63770] DAMAGECOUNT value on done: 6799.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:26,753][63770] Sum rewards: -3.486, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.135', 'weapon7': '0.010', 'AMMO2': '0.010', 'AMMO5': '0.023', 'weapon4': '0.026', 'AMMO4': '0.052', 'WEAPON4': '0.100', 'AMMO3': '0.177', 'weapon5': '0.186', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.350', 'WEAPON5': '0.450', 'WEAPON3': '1.000', 'DAMAGECOUNT': '1.227', 'weapon3': '1.498', 'weapon2': '1.690', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:27,140][63770] DAMAGECOUNT value on done: 7146.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:27,140][63770] Sum rewards: -7.135, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.966', 'AMMO2': '0.002', 'WEAPON1': '0.010', 'AMMO4': '0.010', 'AMMO5': '0.015', 'ARMOR': '0.032', 'weapon5': '0.060', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'AMMO3': '0.106', 'weapon4': '0.112', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.255', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.128', 'weapon2': '1.560'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:27,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11468.8, 300 sec: 11149.5). Total num frames: 11964416. Throughput: 0: 1515.4, 1: 1351.4. Samples: 2988493. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:27,460][109198] Avg episode reward: [(0, '-2.473'), (1, '-2.920')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:27,467][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001428_5849088.pth...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:27,469][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001493_6115328.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:27,526][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001132_4636672.pth\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:27,527][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001135_4648960.pth\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:27,702][63734] DAMAGECOUNT value on done: 8189.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:27,702][63734] Sum rewards: -1.994, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.598', 'AMMO5': '0.005', 'AMMO2': '0.007', 'ARMOR': '0.028', 'AMMO4': '0.037', 'weapon7': '0.076', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.106', 'HITCOUNT': '0.120', 'weapon4': '0.184', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.555', 'WEAPON3': '0.650', 'weapon3': '1.314', 'weapon2': '1.422', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:28,074][63735] DAMAGECOUNT value on done: 7719.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:28,092][63734] DAMAGECOUNT value on done: 7404.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:28,093][63734] Sum rewards: -2.082, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.507', 'weapon7': '0.002', 'AMMO5': '0.012', 'AMMO2': '0.013', 'ARMOR': '0.032', 'AMMO4': '0.065', 'weapon5': '0.106', 'AMMO3': '0.133', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'WEAPON4': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon4': '0.320', 'DAMAGECOUNT': '0.471', 'WEAPON3': '0.750', 'weapon2': '0.838', 'FRAGCOUNT': '1.000', 'weapon3': '1.812'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:28,352][63733] Updated weights for policy 1, policy_version 1430 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:28,416][63735] DAMAGECOUNT value on done: 7824.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:28,416][63735] Sum rewards: -2.896, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.182', 'AMMO4': '-0.044', 'AMMO2': '-0.009', 'AMMO5': '0.010', 'WEAPON4': '0.100', 'AMMO3': '0.101', 'HITCOUNT': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.228', 'ARMOR': '0.535', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.795', 'FRAGCOUNT': '1.000', 'weapon3': '1.412', 'weapon2': '1.508'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:30,860][63769] DAMAGECOUNT value on done: 7703.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:30,861][63769] Sum rewards: -6.887, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.075', 'AMMO5': '0.017', 'AMMO2': '0.020', 'weapon5': '0.046', 'AMMO4': '0.097', 'HITCOUNT': '0.110', 'AMMO3': '0.137', 'WEAPON5': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.800', 'weapon2': '1.368', 'weapon3': '1.652'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:31,211][63769] DAMAGECOUNT value on done: 7393.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:31,212][63769] Sum rewards: -4.140, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.255', 'AMMO4': '-0.016', 'AMMO2': '-0.003', 'AMMO5': '0.008', 'ARMOR': '0.036', 'AMMO3': '0.134', 'HITCOUNT': '0.140', 'weapon5': '0.246', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.492', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.192', 'weapon3': '1.786'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:32,099][63732] Updated weights for policy 0, policy_version 1500 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:32,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11468.8, 300 sec: 11163.3). Total num frames: 12021760. Throughput: 0: 1512.3, 1: 1350.7. Samples: 2997103. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:32,460][109198] Avg episode reward: [(0, '-2.627'), (1, '-2.920')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:33,203][63767] DAMAGECOUNT value on done: 8725.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:33,203][63767] Sum rewards: -2.800, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.530', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.015', 'AMMO4': '0.075', 'AMMO3': '0.137', 'weapon5': '0.194', 'WEAPON5': '0.200', 'HITCOUNT': '0.240', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.867', 'FRAGCOUNT': '1.000', 'weapon2': '1.282', 'weapon3': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:33,537][63767] DAMAGECOUNT value on done: 7597.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:33,538][63767] Sum rewards: -5.962, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.360', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO2': '0.014', 'weapon5': '0.056', 'AMMO4': '0.067', 'AMMO3': '0.128', 'HITCOUNT': '0.160', 'WEAPON5': '0.250', 'WEAPON4': '0.350', 'weapon4': '0.440', 'DAMAGECOUNT': '0.561', 'WEAPON3': '0.650', 'weapon2': '1.338', 'weapon3': '1.362', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:35,196][63735] DAMAGECOUNT value on done: 7972.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:35,197][63735] Sum rewards: -2.193, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.332', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'AMMO4': '0.021', 'ARMOR': '0.060', 'AMMO3': '0.091', 'HITCOUNT': '0.100', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.435', 'weapon4': '0.502', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.218', 'weapon3': '1.498'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:35,555][63735] DAMAGECOUNT value on done: 5481.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:35,556][63735] Sum rewards: 1.275, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.672', 'AMMO5': '0.003', 'AMMO2': '0.017', 'WEAPON1': '0.020', 'ARMOR': '0.048', 'WEAPON5': '0.050', 'AMMO3': '0.086', 'AMMO4': '0.087', 'weapon5': '0.192', 'WEAPON4': '0.200', 'HITCOUNT': '0.200', 'weapon4': '0.312', 'WEAPON3': '0.450', 'DAMAGECOUNT': '1.104', 'weapon3': '1.214', 'weapon2': '1.464', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:35,689][63805] DAMAGECOUNT value on done: 9896.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:35,689][63805] Sum rewards: -1.017, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-2.290', 'AMMO2': '0.003', 'AMMO5': '0.010', 'AMMO4': '0.013', 'WEAPON1': '0.020', 'ARMOR': '0.064', 'weapon5': '0.082', 'AMMO3': '0.098', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'HITCOUNT': '0.230', 'weapon4': '0.348', 'WEAPON3': '0.450', 'weapon3': '0.782', 'DAMAGECOUNT': '1.002', 'weapon2': '1.772', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:35,825][63733] Updated weights for policy 1, policy_version 1440 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:36,073][63805] DAMAGECOUNT value on done: 6578.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:36,074][63805] Sum rewards: -0.336, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.325', 'ARMOR': '0.012', 'AMMO5': '0.018', 'AMMO2': '0.020', 'weapon4': '0.040', 'WEAPON1': '0.050', 'weapon5': '0.056', 'AMMO3': '0.082', 'WEAPON4': '0.100', 'AMMO4': '0.102', 'HITCOUNT': '0.280', 'WEAPON5': '0.350', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.879', 'weapon3': '1.370', 'weapon2': '1.830', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:36,293][63806] DAMAGECOUNT value on done: 5994.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:36,293][63806] Sum rewards: -2.221, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.840', 'AMMO2': '0.009', 'AMMO5': '0.013', 'AMMO4': '0.043', 'ARMOR': '0.056', 'AMMO3': '0.098', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'weapon5': '0.164', 'HITCOUNT': '0.190', 'weapon4': '0.202', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.900', 'weapon2': '1.030', 'weapon3': '1.864', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:36,662][63806] DAMAGECOUNT value on done: 8855.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:36,662][63806] Sum rewards: -5.646, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.924', 'AMMO2': '0.008', 'ARMOR': '0.032', 'AMMO4': '0.037', 'WEAPON4': '0.100', 'AMMO3': '0.106', 'weapon4': '0.150', 'HITCOUNT': '0.160', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.681', 'FRAGCOUNT': '1.000', 'weapon3': '1.390', 'weapon2': '1.714'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:37,445][63769] DAMAGECOUNT value on done: 8731.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:37,458][109198] Fps is (10 sec: 11878.4, 60 sec: 11537.1, 300 sec: 11177.2). Total num frames: 12083200. Throughput: 0: 1514.1, 1: 1353.3. Samples: 3014613. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:37,460][109198] Avg episode reward: [(0, '-2.627'), (1, '-2.810')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:37,467][63576] Saving new best policy, reward=-2.810!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:37,483][63771] DAMAGECOUNT value on done: 5268.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:37,483][63771] Sum rewards: -3.224, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.460', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'AMMO5': '0.020', 'AMMO4': '0.021', 'weapon4': '0.024', 'ARMOR': '0.036', 'WEAPON4': '0.050', 'weapon7': '0.054', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.131', 'HITCOUNT': '0.150', 'weapon5': '0.158', 'WEAPON7': '0.200', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.630', 'WEAPON3': '0.850', 'weapon2': '1.300', 'weapon3': '1.758', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:37,775][63769] DAMAGECOUNT value on done: 6411.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:37,775][63769] Sum rewards: -4.015, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.666', 'AMMO5': '0.005', 'AMMO2': '0.013', 'weapon5': '0.020', 'AMMO4': '0.064', 'ARMOR': '0.076', 'WEAPON5': '0.100', 'AMMO3': '0.149', 'HITCOUNT': '0.160', 'WEAPON4': '0.350', 'weapon4': '0.482', 'DAMAGECOUNT': '0.660', 'WEAPON3': '1.000', 'weapon2': '1.230', 'weapon3': '1.842', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:37,820][63771] DAMAGECOUNT value on done: 7545.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:37,821][63771] Sum rewards: -6.640, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.492', 'AMMO4': '-0.037', 'AMMO2': '-0.007', 'AMMO5': '0.017', 'ARMOR': '0.036', 'weapon5': '0.066', 'HITCOUNT': '0.170', 'AMMO3': '0.171', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.567', 'WEAPON3': '1.100', 'weapon2': '1.486', 'weapon3': '1.832', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:38,739][63732] Updated weights for policy 0, policy_version 1510 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:40,432][63770] DAMAGECOUNT value on done: 8895.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:40,821][63770] DAMAGECOUNT value on done: 6108.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:41,529][63767] DAMAGECOUNT value on done: 9585.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:41,530][63767] Sum rewards: -4.914, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-2.130', 'AMMO4': '-0.004', 'AMMO2': '-0.001', 'AMMO5': '0.020', 'WEAPON1': '0.030', 'ARMOR': '0.048', 'weapon5': '0.070', 'AMMO3': '0.221', 'HITCOUNT': '0.290', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.930', 'weapon2': '1.196', 'WEAPON3': '1.300', 'weapon3': '2.266', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:41,855][63767] DAMAGECOUNT value on done: 9731.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:41,855][63767] Sum rewards: -5.349, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.030', 'AMMO5': '0.005', 'AMMO2': '0.013', 'weapon5': '0.026', 'WEAPON5': '0.050', 'ARMOR': '0.064', 'AMMO4': '0.064', 'AMMO3': '0.154', 'WEAPON4': '0.200', 'weapon4': '0.330', 'HITCOUNT': '0.350', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.900', 'weapon2': '1.008', 'DAMAGECOUNT': '1.275', 'weapon3': '1.992'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:42,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11468.8, 300 sec: 11191.1). Total num frames: 12136448. Throughput: 0: 1516.2, 1: 1353.6. Samples: 3031958. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:42,460][109198] Avg episode reward: [(0, '-2.723'), (1, '-2.918')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:43,307][63733] Updated weights for policy 1, policy_version 1450 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:44,191][63805] DAMAGECOUNT value on done: 9050.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:44,191][63805] Sum rewards: -3.047, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.510', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'WEAPON5': '0.100', 'AMMO3': '0.131', 'HITCOUNT': '0.250', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.870', 'FRAGCOUNT': '1.000', 'weapon2': '1.446', 'weapon3': '1.922'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:44,547][63805] DAMAGECOUNT value on done: 9033.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:44,547][63805] Sum rewards: -2.143, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.420', 'AMMO2': '0.004', 'AMMO5': '0.014', 'AMMO4': '0.022', 'ARMOR': '0.040', 'weapon4': '0.092', 'WEAPON4': '0.100', 'AMMO3': '0.140', 'weapon5': '0.152', 'WEAPON5': '0.300', 'HITCOUNT': '0.370', 'WEAPON3': '0.950', 'weapon2': '0.974', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.176', 'weapon3': '2.192'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:45,341][63732] Updated weights for policy 0, policy_version 1520 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:46,131][63734] DAMAGECOUNT value on done: 7585.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:46,132][63734] Sum rewards: -4.110, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.210', 'AMMO5': '0.005', 'weapon5': '0.016', 'AMMO2': '0.021', 'HITCOUNT': '0.080', 'AMMO3': '0.099', 'WEAPON5': '0.100', 'AMMO4': '0.103', 'WEAPON4': '0.250', 'weapon4': '0.266', 'DAMAGECOUNT': '0.435', 'ARMOR': '0.445', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.268', 'weapon2': '1.612'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:46,526][63734] DAMAGECOUNT value on done: 5984.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:46,527][63734] Sum rewards: -5.726, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.040', 'AMMO2': '0.004', 'AMMO5': '0.005', 'AMMO4': '0.022', 'ARMOR': '0.052', 'HITCOUNT': '0.090', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.148', 'AMMO3': '0.149', 'DAMAGECOUNT': '0.240', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.400', 'weapon3': '1.804'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:47,383][63771] DAMAGECOUNT value on done: 8888.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:47,383][63771] Sum rewards: -2.624, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.238', 'AMMO5': '0.005', 'AMMO2': '0.023', 'weapon5': '0.026', 'AMMO3': '0.089', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.114', 'ARMOR': '0.152', 'weapon4': '0.182', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.508', 'weapon2': '1.700'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:47,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11468.8, 300 sec: 11205.0). Total num frames: 12197888. Throughput: 0: 1518.8, 1: 1355.2. Samples: 3040809. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:47,459][109198] Avg episode reward: [(0, '-2.713'), (1, '-2.918')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:47,768][63771] DAMAGECOUNT value on done: 6275.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:47,769][63771] Sum rewards: -0.195, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.069', 'AMMO4': '-0.008', 'AMMO2': '-0.001', 'AMMO5': '0.007', 'ARMOR': '0.008', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'AMMO3': '0.129', 'weapon4': '0.156', 'HITCOUNT': '0.270', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.894', 'weapon2': '1.250', 'weapon3': '1.718', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:48,364][63806] DAMAGECOUNT value on done: 8085.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:48,721][63806] DAMAGECOUNT value on done: 7736.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:48,721][63806] Sum rewards: 6.558, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.380', 'AMMO2': '0.000', 'AMMO4': '0.000', 'WEAPON1': '0.010', 'AMMO5': '0.013', 'AMMO3': '0.146', 'weapon7': '0.178', 'HITCOUNT': '0.240', 'weapon5': '0.270', 'AMMO6': '0.320', 'AMMO7': '0.320', 'WEAPON5': '0.350', 'WEAPON7': '0.400', 'ARMOR': '0.482', 'WEAPON3': '0.750', 'weapon2': '1.006', 'DAMAGECOUNT': '1.308', 'weapon3': '1.894', 'FRAGCOUNT': '7.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:50,760][63735] DAMAGECOUNT value on done: 7868.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:50,760][63735] Sum rewards: -0.894, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.079', 'AMMO5': '0.003', 'AMMO2': '0.018', 'WEAPON5': '0.050', 'AMMO4': '0.089', 'weapon5': '0.124', 'HITCOUNT': '0.130', 'AMMO3': '0.147', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.447', 'ARMOR': '0.502', 'weapon4': '0.512', 'WEAPON3': '0.800', 'weapon2': '1.132', 'weapon3': '1.432', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:50,908][63733] Updated weights for policy 1, policy_version 1460 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:51,088][63735] DAMAGECOUNT value on done: 7994.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:51,089][63735] Sum rewards: -6.598, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.902', 'AMMO2': '0.011', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.053', 'WEAPON4': '0.100', 'weapon5': '0.112', 'AMMO3': '0.131', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'weapon4': '0.326', 'ARMOR': '0.432', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.154', 'weapon2': '1.752'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:51,112][63734] DAMAGECOUNT value on done: 8464.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:51,112][63734] Sum rewards: 0.149, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.432', 'AMMO2': '0.000', 'AMMO4': '0.002', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'ARMOR': '0.072', 'AMMO3': '0.122', 'WEAPON4': '0.200', 'weapon5': '0.220', 'HITCOUNT': '0.250', 'WEAPON5': '0.300', 'weapon4': '0.452', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.825', 'weapon3': '1.192', 'weapon2': '1.470', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:51,513][63734] DAMAGECOUNT value on done: 7961.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:51,514][63734] Sum rewards: 3.562, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.882', 'AMMO2': '0.006', 'weapon5': '0.006', 'AMMO5': '0.007', 'AMMO4': '0.027', 'ARMOR': '0.067', 'WEAPON4': '0.100', 'AMMO3': '0.139', 'WEAPON5': '0.150', 'weapon4': '0.160', 'HITCOUNT': '0.400', 'WEAPON3': '0.850', 'weapon2': '1.434', 'DAMAGECOUNT': '1.671', 'weapon3': '1.926', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:51,857][63770] DAMAGECOUNT value on done: 7041.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:51,858][63770] Sum rewards: 0.112, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.606', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'AMMO5': '0.022', 'WEAPON4': '0.050', 'weapon4': '0.052', 'AMMO3': '0.122', 'weapon5': '0.152', 'HITCOUNT': '0.160', 'WEAPON5': '0.450', 'ARMOR': '0.513', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.726', 'weapon3': '1.332', 'weapon2': '1.952', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:52,143][63732] Updated weights for policy 0, policy_version 1530 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:52,246][63770] DAMAGECOUNT value on done: 7415.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:52,247][63770] Sum rewards: -5.070, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.344', 'AMMO5': '0.015', 'AMMO2': '0.023', 'ARMOR': '0.076', 'AMMO3': '0.113', 'AMMO4': '0.116', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.206', 'HITCOUNT': '0.220', 'weapon4': '0.444', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.807', 'FRAGCOUNT': '1.000', 'weapon2': '1.310', 'weapon3': '1.444'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:52,458][109198] Fps is (10 sec: 11878.5, 60 sec: 11537.1, 300 sec: 11205.0). Total num frames: 12255232. Throughput: 0: 1515.9, 1: 1352.8. Samples: 3057874. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:52,460][109198] Avg episode reward: [(0, '-2.419'), (1, '-2.893')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:53,872][63769] DAMAGECOUNT value on done: 8075.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:53,873][63769] Sum rewards: -0.019, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.354', 'AMMO2': '0.014', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.067', 'weapon5': '0.126', 'AMMO3': '0.139', 'WEAPON4': '0.150', 'WEAPON5': '0.250', 'weapon4': '0.280', 'HITCOUNT': '0.350', 'ARMOR': '0.496', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.116', 'weapon3': '1.316', 'weapon2': '1.696', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:54,266][63769] DAMAGECOUNT value on done: 7719.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:54,266][63769] Sum rewards: -1.679, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.970', 'AMMO5': '0.008', 'AMMO2': '0.021', 'ARMOR': '0.080', 'weapon5': '0.080', 'WEAPON4': '0.100', 'AMMO4': '0.104', 'AMMO3': '0.115', 'weapon4': '0.134', 'WEAPON5': '0.150', 'HITCOUNT': '0.240', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.978', 'weapon2': '1.632', 'weapon3': '1.650', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:56,079][63767] DAMAGECOUNT value on done: 9174.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:56,080][63767] Sum rewards: -4.997, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.301', 'AMMO2': '0.008', 'WEAPON1': '0.010', 'AMMO5': '0.019', 'ARMOR': '0.036', 'AMMO4': '0.042', 'AMMO3': '0.075', 'weapon4': '0.094', 'WEAPON4': '0.100', 'HITCOUNT': '0.240', 'WEAPON5': '0.300', 'weapon5': '0.418', 'WEAPON3': '0.550', 'weapon2': '1.182', 'DAMAGECOUNT': '1.347', 'FRAGCOUNT': '1.500', 'weapon3': '1.632'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:56,451][63767] DAMAGECOUNT value on done: 7770.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:56,452][63767] Sum rewards: -6.262, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.604', 'weapon5': '0.008', 'AMMO2': '0.012', 'ARMOR': '0.012', 'AMMO5': '0.012', 'AMMO4': '0.058', 'AMMO3': '0.137', 'HITCOUNT': '0.200', 'WEAPON5': '0.200', 'WEAPON4': '0.350', 'DAMAGECOUNT': '0.519', 'weapon4': '0.544', 'weapon2': '0.944', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon3': '1.896'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:57,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11537.1, 300 sec: 11218.9). Total num frames: 12312576. Throughput: 0: 1520.7, 1: 1357.8. Samples: 3075282. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:54:57,460][109198] Avg episode reward: [(0, '-2.386'), (1, '-2.940')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:57,624][63735] DAMAGECOUNT value on done: 8067.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:57,925][63735] DAMAGECOUNT value on done: 5636.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:57,926][63735] Sum rewards: -3.497, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.171', 'AMMO4': '-0.037', 'AMMO2': '-0.007', 'AMMO5': '0.005', 'weapon5': '0.016', 'ARMOR': '0.040', 'WEAPON1': '0.040', 'weapon4': '0.078', 'AMMO3': '0.094', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.140', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.465', 'FRAGCOUNT': '1.000', 'weapon3': '1.132', 'weapon2': '1.808'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:58,321][63733] Updated weights for policy 1, policy_version 1470 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:58,429][63806] DAMAGECOUNT value on done: 6129.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:58,430][63806] Sum rewards: -3.165, reward structure: {'DEATHCOUNT': '-9.000', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.015', 'WEAPON5': '0.050', 'AMMO4': '0.073', 'HEALTH': '0.080', 'AMMO3': '0.099', 'HITCOUNT': '0.110', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.630', 'weapon3': '1.710'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:58,510][63805] DAMAGECOUNT value on done: 10021.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:58,761][63806] DAMAGECOUNT value on done: 8945.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:58,809][63732] Updated weights for policy 0, policy_version 1540 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:58,844][63805] DAMAGECOUNT value on done: 6992.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:54:58,845][63805] Sum rewards: -1.759, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.829', 'AMMO5': '0.003', 'ARMOR': '0.004', 'weapon5': '0.008', 'AMMO2': '0.012', 'WEAPON5': '0.050', 'AMMO4': '0.057', 'AMMO3': '0.113', 'WEAPON4': '0.200', 'weapon4': '0.230', 'HITCOUNT': '0.280', 'WEAPON3': '0.800', 'weapon2': '0.962', 'DAMAGECOUNT': '1.242', 'weapon3': '2.110', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:00,229][63769] DAMAGECOUNT value on done: 8797.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:00,553][63769] DAMAGECOUNT value on done: 6646.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:00,554][63769] Sum rewards: 0.175, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.990', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'weapon5': '0.048', 'AMMO4': '0.054', 'weapon4': '0.064', 'AMMO3': '0.073', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'HITCOUNT': '0.160', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.705', 'weapon3': '1.614', 'weapon2': '1.618', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:00,773][63771] DAMAGECOUNT value on done: 5498.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:00,774][63771] Sum rewards: -5.819, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.839', 'AMMO2': '0.006', 'WEAPON1': '0.020', 'AMMO5': '0.025', 'AMMO4': '0.030', 'weapon5': '0.050', 'WEAPON4': '0.100', 'AMMO3': '0.194', 'HITCOUNT': '0.220', 'weapon4': '0.220', 'WEAPON5': '0.350', 'ARMOR': '0.473', 'DAMAGECOUNT': '0.690', 'WEAPON3': '1.150', 'weapon2': '1.312', 'weapon3': '1.930', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:01,193][63771] DAMAGECOUNT value on done: 8093.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:01,193][63771] Sum rewards: -3.640, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.716', 'AMMO2': '0.002', 'ARMOR': '0.004', 'AMMO4': '0.008', 'AMMO5': '0.019', 'AMMO3': '0.163', 'weapon5': '0.298', 'WEAPON5': '0.300', 'HITCOUNT': '0.340', 'FRAGCOUNT': '0.500', 'weapon2': '0.540', 'WEAPON3': '1.050', 'DAMAGECOUNT': '1.644', 'weapon3': '2.208'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:02,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11537.1, 300 sec: 11218.9). Total num frames: 12369920. Throughput: 0: 1526.6, 1: 1361.2. Samples: 3084039. Policy #0 lag: (min: 0.0, avg: 0.4, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:02,460][109198] Avg episode reward: [(0, '-2.517'), (1, '-2.975')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:04,494][63767] DAMAGECOUNT value on done: 9675.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:04,494][63767] Sum rewards: -3.996, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.542', 'AMMO5': '0.010', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'weapon5': '0.070', 'AMMO4': '0.090', 'HITCOUNT': '0.110', 'AMMO3': '0.124', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.270', 'weapon4': '0.276', 'ARMOR': '0.463', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.344', 'weapon3': '1.450'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:04,850][63767] DAMAGECOUNT value on done: 10195.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:04,851][63767] Sum rewards: -1.098, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.492', 'AMMO2': '0.004', 'AMMO5': '0.005', 'AMMO4': '0.019', 'weapon5': '0.056', 'WEAPON5': '0.100', 'AMMO3': '0.140', 'WEAPON4': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon4': '0.378', 'HITCOUNT': '0.400', 'ARMOR': '0.472', 'WEAPON3': '0.700', 'weapon3': '1.320', 'DAMAGECOUNT': '1.392', 'weapon2': '1.608', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:05,495][63770] DAMAGECOUNT value on done: 9030.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:05,496][63770] Sum rewards: -3.068, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.771', 'AMMO4': '-0.047', 'AMMO2': '-0.009', 'AMMO5': '0.005', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.122', 'AMMO3': '0.141', 'HITCOUNT': '0.150', 'weapon7': '0.152', 'weapon4': '0.266', 'AMMO6': '0.320', 'AMMO7': '0.320', 'WEAPON7': '0.400', 'DAMAGECOUNT': '0.405', 'ARMOR': '0.460', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.800', 'weapon3': '1.352', 'weapon2': '1.416'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:05,580][63732] Updated weights for policy 0, policy_version 1550 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:05,916][63733] Updated weights for policy 1, policy_version 1480 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:05,934][63770] DAMAGECOUNT value on done: 6728.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:05,934][63770] Sum rewards: -1.362, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.169', 'AMMO4': '-0.018', 'AMMO2': '-0.004', 'ARMOR': '0.004', 'AMMO5': '0.007', 'weapon5': '0.020', 'AMMO3': '0.101', 'WEAPON5': '0.150', 'HITCOUNT': '0.470', 'WEAPON3': '0.600', 'weapon3': '1.388', 'weapon2': '1.728', 'DAMAGECOUNT': '1.860', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:07,459][109198] Fps is (10 sec: 11468.6, 60 sec: 11537.0, 300 sec: 11218.9). Total num frames: 12427264. Throughput: 0: 1526.6, 1: 1361.7. Samples: 3101266. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:07,460][109198] Avg episode reward: [(0, '-2.599'), (1, '-2.973')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:07,501][63805] DAMAGECOUNT value on done: 9268.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:07,502][63805] Sum rewards: -1.182, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.584', 'AMMO2': '0.003', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO4': '0.016', 'ARMOR': '0.052', 'weapon5': '0.062', 'WEAPON5': '0.100', 'AMMO3': '0.155', 'HITCOUNT': '0.260', 'DAMAGECOUNT': '0.654', 'WEAPON3': '0.750', 'weapon2': '1.150', 'weapon3': '2.184', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:07,824][63805] DAMAGECOUNT value on done: 9389.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:07,824][63805] Sum rewards: -2.168, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.354', 'AMMO5': '0.013', 'AMMO2': '0.029', 'weapon5': '0.068', 'ARMOR': '0.072', 'WEAPON5': '0.100', 'weapon4': '0.118', 'AMMO3': '0.133', 'AMMO4': '0.147', 'WEAPON4': '0.150', 'HITCOUNT': '0.270', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.068', 'weapon3': '1.366', 'weapon2': '1.652', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:10,453][63771] DAMAGECOUNT value on done: 9185.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:10,453][63771] Sum rewards: -4.360, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.942', 'AMMO2': '0.008', 'AMMO5': '0.010', 'weapon5': '0.016', 'AMMO4': '0.040', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.102', 'weapon4': '0.120', 'HITCOUNT': '0.280', 'ARMOR': '0.507', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.891', 'weapon2': '1.472', 'weapon3': '1.586', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:10,782][63771] DAMAGECOUNT value on done: 6576.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:10,805][63806] DAMAGECOUNT value on done: 8554.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:10,805][63806] Sum rewards: 0.082, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.828', 'AMMO5': '0.006', 'AMMO2': '0.014', 'ARMOR': '0.040', 'AMMO4': '0.069', 'AMMO3': '0.131', 'WEAPON5': '0.150', 'HITCOUNT': '0.200', 'weapon5': '0.212', 'weapon4': '0.218', 'WEAPON4': '0.250', 'WEAPON3': '0.750', 'weapon2': '1.406', 'DAMAGECOUNT': '1.407', 'weapon3': '1.556', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:11,113][63734] DAMAGECOUNT value on done: 7734.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:11,113][63734] Sum rewards: -1.256, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.316', 'AMMO2': '0.009', 'ARMOR': '0.016', 'AMMO5': '0.020', 'AMMO4': '0.045', 'WEAPON4': '0.050', 'AMMO3': '0.105', 'HITCOUNT': '0.160', 'weapon5': '0.202', 'weapon4': '0.254', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.447', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.158', 'weapon3': '1.444'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:11,179][63806] DAMAGECOUNT value on done: 8047.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:11,180][63806] Sum rewards: -1.178, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.650', 'AMMO2': '0.002', 'AMMO4': '0.007', 'AMMO5': '0.010', 'ARMOR': '0.056', 'WEAPON4': '0.100', 'AMMO3': '0.138', 'weapon5': '0.240', 'HITCOUNT': '0.280', 'WEAPON5': '0.300', 'weapon4': '0.386', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.933', 'weapon2': '1.220', 'weapon3': '1.500', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:11,499][63734] DAMAGECOUNT value on done: 6109.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:11,499][63734] Sum rewards: -4.072, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.381', 'AMMO5': '0.013', 'weapon5': '0.014', 'AMMO2': '0.021', 'WEAPON1': '0.040', 'ARMOR': '0.048', 'AMMO3': '0.072', 'AMMO4': '0.104', 'HITCOUNT': '0.110', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.400', 'weapon4': '0.502', 'weapon3': '0.870', 'FRAGCOUNT': '1.000', 'weapon2': '1.490'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:12,289][63732] Updated weights for policy 0, policy_version 1560 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:12,459][109198] Fps is (10 sec: 11468.5, 60 sec: 11468.8, 300 sec: 11232.8). Total num frames: 12484608. Throughput: 0: 1528.5, 1: 1362.4. Samples: 3118583. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:12,460][109198] Avg episode reward: [(0, '-2.519'), (1, '-3.027')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:13,428][63733] Updated weights for policy 1, policy_version 1490 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:13,535][63735] DAMAGECOUNT value on done: 8116.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:13,536][63735] Sum rewards: -2.784, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.440', 'AMMO2': '0.008', 'weapon5': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.039', 'ARMOR': '0.040', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon7': '0.134', 'HITCOUNT': '0.140', 'AMMO3': '0.145', 'WEAPON7': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.228', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.744', 'WEAPON3': '0.800', 'weapon2': '1.362', 'weapon3': '1.604', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:13,938][63735] DAMAGECOUNT value on done: 8461.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:13,939][63735] Sum rewards: 1.164, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.519', 'AMMO2': '0.001', 'AMMO4': '0.004', 'weapon5': '0.012', 'AMMO5': '0.013', 'ARMOR': '0.020', 'WEAPON4': '0.100', 'AMMO3': '0.122', 'weapon4': '0.208', 'WEAPON5': '0.250', 'HITCOUNT': '0.380', 'WEAPON3': '0.850', 'weapon2': '1.048', 'DAMAGECOUNT': '1.401', 'weapon3': '2.024', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:14,353][63734] DAMAGECOUNT value on done: 8594.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:14,353][63734] Sum rewards: -2.315, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.430', 'AMMO2': '0.003', 'AMMO5': '0.014', 'AMMO4': '0.015', 'ARMOR': '0.072', 'weapon5': '0.098', 'AMMO3': '0.115', 'HITCOUNT': '0.120', 'WEAPON4': '0.150', 'weapon4': '0.290', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.034', 'weapon2': '1.714'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:14,700][63734] DAMAGECOUNT value on done: 8209.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:14,701][63734] Sum rewards: -8.335, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-1.296', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'AMMO2': '0.022', 'weapon5': '0.032', 'weapon4': '0.082', 'AMMO4': '0.111', 'WEAPON4': '0.150', 'AMMO3': '0.171', 'WEAPON5': '0.250', 'HITCOUNT': '0.260', 'DAMAGECOUNT': '0.744', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon3': '1.692', 'weapon2': '1.772'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:17,098][63770] DAMAGECOUNT value on done: 7130.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:17,295][63769] DAMAGECOUNT value on done: 8729.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:17,295][63769] Sum rewards: 2.295, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.646', 'AMMO4': '-0.017', 'AMMO2': '-0.003', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'ARMOR': '0.020', 'AMMO3': '0.135', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.250', 'weapon5': '0.268', 'HITCOUNT': '0.340', 'WEAPON3': '0.900', 'weapon2': '1.094', 'DAMAGECOUNT': '1.962', 'weapon3': '2.120', 'FRAGCOUNT': '6.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:17,458][109198] Fps is (10 sec: 11469.0, 60 sec: 11537.1, 300 sec: 11232.8). Total num frames: 12541952. Throughput: 0: 1527.9, 1: 1362.6. Samples: 3127174. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:17,460][109198] Avg episode reward: [(0, '-2.446'), (1, '-3.027')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:17,517][63770] DAMAGECOUNT value on done: 7710.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:17,517][63770] Sum rewards: -0.583, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO2': '0.009', 'WEAPON1': '0.010', 'ARMOR': '0.040', 'AMMO4': '0.044', 'AMMO3': '0.119', 'WEAPON4': '0.150', 'weapon4': '0.164', 'HITCOUNT': '0.200', 'HEALTH': '0.254', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.885', 'weapon2': '1.528', 'weapon3': '1.664', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:17,705][63769] DAMAGECOUNT value on done: 7894.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:17,708][63769] Sum rewards: -7.442, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.648', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'AMMO4': '0.022', 'AMMO5': '0.028', 'weapon4': '0.076', 'WEAPON4': '0.100', 'weapon5': '0.108', 'HITCOUNT': '0.160', 'AMMO3': '0.212', 'WEAPON5': '0.450', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.525', 'WEAPON3': '0.900', 'weapon3': '1.484', 'weapon2': '1.626'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:18,831][63767] DAMAGECOUNT value on done: 9249.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:18,831][63767] Sum rewards: -0.263, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.018', 'weapon5': '0.024', 'HITCOUNT': '0.050', 'AMMO3': '0.076', 'ARMOR': '0.084', 'AMMO4': '0.090', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.225', 'weapon4': '0.232', 'WEAPON3': '0.450', 'HEALTH': '0.458', 'FRAGCOUNT': '1.000', 'weapon2': '1.184', 'weapon3': '1.578'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:19,138][63732] Updated weights for policy 0, policy_version 1570 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:19,184][63767] DAMAGECOUNT value on done: 8275.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:19,185][63767] Sum rewards: 2.312, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.992', 'AMMO5': '0.005', 'AMMO2': '0.008', 'AMMO4': '0.040', 'weapon5': '0.042', 'AMMO3': '0.080', 'ARMOR': '0.088', 'WEAPON5': '0.100', 'WEAPON4': '0.300', 'weapon4': '0.340', 'HITCOUNT': '0.390', 'WEAPON3': '0.500', 'weapon2': '1.468', 'DAMAGECOUNT': '1.515', 'weapon3': '1.678', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:20,362][63735] DAMAGECOUNT value on done: 8279.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:20,363][63735] Sum rewards: 0.040, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.717', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO2': '0.027', 'AMMO3': '0.081', 'weapon5': '0.128', 'AMMO4': '0.135', 'WEAPON5': '0.150', 'HITCOUNT': '0.190', 'WEAPON4': '0.250', 'weapon4': '0.340', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.636', 'weapon2': '1.232', 'weapon3': '1.460', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:20,687][63735] DAMAGECOUNT value on done: 5756.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:20,996][63806] DAMAGECOUNT value on done: 6508.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:20,997][63806] Sum rewards: -6.038, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.972', 'AMMO2': '0.008', 'ARMOR': '0.008', 'AMMO4': '0.039', 'WEAPON4': '0.050', 'weapon4': '0.136', 'AMMO3': '0.188', 'HITCOUNT': '0.300', 'weapon2': '0.954', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.137', 'WEAPON3': '1.150', 'weapon3': '2.214'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:21,180][63733] Updated weights for policy 1, policy_version 1500 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:21,398][63806] DAMAGECOUNT value on done: 9095.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:21,399][63806] Sum rewards: -5.251, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.021', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.008', 'AMMO2': '-0.001', 'AMMO5': '0.004', 'WEAPON1': '0.020', 'weapon5': '0.028', 'AMMO3': '0.085', 'WEAPON5': '0.100', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.550', 'weapon3': '1.408', 'weapon2': '1.714'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:21,429][63805] DAMAGECOUNT value on done: 10248.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:21,429][63805] Sum rewards: -3.757, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.871', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.018', 'weapon4': '0.048', 'ARMOR': '0.060', 'AMMO4': '0.090', 'WEAPON4': '0.100', 'AMMO3': '0.154', 'weapon5': '0.156', 'WEAPON5': '0.200', 'HITCOUNT': '0.230', 'DAMAGECOUNT': '0.681', 'WEAPON3': '0.850', 'weapon2': '1.260', 'weapon3': '1.996', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:21,775][63805] DAMAGECOUNT value on done: 7174.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:21,776][63805] Sum rewards: -4.792, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.280', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'ARMOR': '0.072', 'AMMO3': '0.122', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.546', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.780', 'weapon3': '1.806'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:22,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11468.8, 300 sec: 11218.9). Total num frames: 12595200. Throughput: 0: 1522.0, 1: 1354.5. Samples: 3144054. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:22,460][109198] Avg episode reward: [(0, '-2.518'), (1, '-2.928')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:23,471][63769] DAMAGECOUNT value on done: 9012.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:23,797][63769] DAMAGECOUNT value on done: 6934.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:23,797][63769] Sum rewards: -5.256, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.350', 'AMMO5': '0.003', 'AMMO2': '0.006', 'AMMO4': '0.031', 'AMMO3': '0.146', 'HITCOUNT': '0.230', 'DAMAGECOUNT': '0.864', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.328', 'weapon3': '2.036'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:24,221][63771] DAMAGECOUNT value on done: 5824.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:24,222][63771] Sum rewards: 0.522, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.855', 'AMMO5': '0.003', 'AMMO2': '0.009', 'weapon5': '0.010', 'ARMOR': '0.040', 'AMMO4': '0.047', 'WEAPON5': '0.050', 'AMMO3': '0.120', 'HITCOUNT': '0.300', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.978', 'weapon3': '1.654', 'weapon2': '1.666', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:24,661][63771] DAMAGECOUNT value on done: 8309.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:24,662][63771] Sum rewards: -0.917, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.976', 'weapon5': '0.002', 'AMMO5': '0.010', 'AMMO2': '0.030', 'ARMOR': '0.052', 'AMMO3': '0.147', 'AMMO4': '0.148', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'WEAPON4': '0.350', 'weapon4': '0.546', 'DAMAGECOUNT': '0.648', 'WEAPON3': '0.750', 'weapon2': '0.760', 'weapon3': '1.796', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:25,957][63732] Updated weights for policy 0, policy_version 1580 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:27,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11537.1, 300 sec: 11246.6). Total num frames: 12656640. Throughput: 0: 1518.3, 1: 1351.2. Samples: 3161082. Policy #0 lag: (min: 0.0, avg: 0.3, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:27,460][109198] Avg episode reward: [(0, '-2.459'), (1, '-2.951')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:27,947][63767] DAMAGECOUNT value on done: 9785.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:27,948][63767] Sum rewards: -1.616, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.078', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO4': '0.051', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.113', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.330', 'weapon4': '0.344', 'ARMOR': '0.567', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.320', 'weapon3': '1.462'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:28,311][63767] DAMAGECOUNT value on done: 11140.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:28,312][63767] Sum rewards: 5.121, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.926', 'AMMO2': '0.017', 'AMMO5': '0.027', 'weapon7': '0.038', 'ARMOR': '0.056', 'AMMO4': '0.083', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.116', 'WEAPON4': '0.250', 'weapon5': '0.260', 'HITCOUNT': '0.300', 'WEAPON5': '0.350', 'weapon4': '0.462', 'WEAPON3': '0.650', 'weapon2': '1.060', 'weapon3': '1.492', 'DAMAGECOUNT': '2.835', 'FRAGCOUNT': '4.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:28,768][63733] Updated weights for policy 1, policy_version 1510 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:30,779][63805] DAMAGECOUNT value on done: 9490.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:30,779][63805] Sum rewards: -5.836, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.314', 'AMMO5': '0.010', 'AMMO2': '0.016', 'AMMO4': '0.080', 'WEAPON4': '0.100', 'ARMOR': '0.112', 'weapon5': '0.122', 'AMMO3': '0.139', 'HITCOUNT': '0.190', 'WEAPON5': '0.250', 'weapon4': '0.278', 'DAMAGECOUNT': '0.666', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.362', 'weapon3': '1.602'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:30,969][63770] DAMAGECOUNT value on done: 9523.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:30,969][63770] Sum rewards: 3.513, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.426', 'AMMO5': '0.010', 'AMMO2': '0.018', 'AMMO3': '0.070', 'AMMO4': '0.091', 'ARMOR': '0.116', 'WEAPON4': '0.150', 'weapon5': '0.196', 'weapon4': '0.214', 'WEAPON5': '0.250', 'HITCOUNT': '0.390', 'WEAPON3': '0.450', 'weapon2': '0.858', 'DAMAGECOUNT': '1.479', 'weapon3': '1.646', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:31,107][63805] DAMAGECOUNT value on done: 9837.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:31,108][63805] Sum rewards: 0.947, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.267', 'weapon4': '0.010', 'AMMO2': '0.011', 'AMMO5': '0.018', 'ARMOR': '0.028', 'AMMO4': '0.055', 'WEAPON4': '0.100', 'weapon5': '0.132', 'AMMO3': '0.186', 'WEAPON5': '0.300', 'HITCOUNT': '0.400', 'WEAPON3': '0.900', 'weapon2': '1.202', 'DAMAGECOUNT': '1.344', 'weapon3': '2.278', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:31,421][63770] DAMAGECOUNT value on done: 6833.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:31,422][63770] Sum rewards: -2.918, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.399', 'AMMO2': '0.003', 'AMMO4': '0.012', 'AMMO5': '0.015', 'ARMOR': '0.016', 'WEAPON1': '0.020', 'weapon5': '0.030', 'HITCOUNT': '0.100', 'AMMO3': '0.107', 'WEAPON4': '0.150', 'weapon4': '0.282', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.352', 'weapon3': '1.580'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:32,458][109198] Fps is (10 sec: 11469.1, 60 sec: 11468.8, 300 sec: 11232.8). Total num frames: 12709888. Throughput: 0: 1514.4, 1: 1349.6. Samples: 3169685. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:32,460][109198] Avg episode reward: [(0, '-2.347'), (1, '-2.980')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:32,646][63732] Updated weights for policy 0, policy_version 1590 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:33,637][63771] DAMAGECOUNT value on done: 9585.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:33,637][63771] Sum rewards: -1.684, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.060', 'AMMO4': '-0.045', 'AMMO2': '-0.009', 'ARMOR': '0.044', 'AMMO3': '0.082', 'WEAPON4': '0.200', 'weapon4': '0.240', 'HITCOUNT': '0.260', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.200', 'weapon3': '1.358', 'weapon2': '1.946', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:33,838][63806] DAMAGECOUNT value on done: 8998.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:33,839][63806] Sum rewards: 1.916, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.536', 'AMMO4': '-0.022', 'AMMO2': '-0.004', 'WEAPON1': '0.010', 'AMMO5': '0.022', 'AMMO3': '0.138', 'weapon5': '0.152', 'weapon7': '0.188', 'HITCOUNT': '0.300', 'WEAPON5': '0.400', 'AMMO6': '0.420', 'AMMO7': '0.420', 'ARMOR': '0.487', 'WEAPON7': '0.500', 'WEAPON3': '0.850', 'weapon2': '1.186', 'DAMAGECOUNT': '1.332', 'weapon3': '1.822', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:34,034][63771] DAMAGECOUNT value on done: 6663.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:34,221][63806] DAMAGECOUNT value on done: 8087.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:34,221][63806] Sum rewards: -7.248, reward structure: {'DEATHCOUNT': '-10.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.148', 'AMMO2': '0.016', 'AMMO5': '0.023', 'ARMOR': '0.023', 'WEAPON1': '0.030', 'HITCOUNT': '0.050', 'AMMO4': '0.081', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.120', 'AMMO3': '0.127', 'weapon4': '0.204', 'weapon5': '0.280', 'WEAPON5': '0.400', 'WEAPON3': '0.550', 'weapon2': '1.428', 'weapon3': '1.468'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:36,344][63733] Updated weights for policy 1, policy_version 1520 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:36,420][63734] DAMAGECOUNT value on done: 8091.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:36,421][63734] Sum rewards: 1.501, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO5': '0.007', 'ARMOR': '0.008', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'weapon4': '0.026', 'AMMO4': '0.082', 'AMMO3': '0.113', 'weapon5': '0.116', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon7': '0.122', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.250', 'HEALTH': '0.362', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.071', 'weapon2': '1.086', 'weapon3': '1.990', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:36,439][63735] DAMAGECOUNT value on done: 8354.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:36,439][63735] Sum rewards: -4.055, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.393', 'AMMO5': '0.010', 'AMMO2': '0.012', 'AMMO4': '0.062', 'ARMOR': '0.068', 'weapon5': '0.090', 'WEAPON5': '0.100', 'AMMO3': '0.148', 'WEAPON4': '0.250', 'HITCOUNT': '0.250', 'weapon4': '0.298', 'DAMAGECOUNT': '0.714', 'WEAPON3': '0.850', 'weapon2': '1.262', 'weapon3': '1.724', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:36,809][63734] DAMAGECOUNT value on done: 6279.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:36,814][63735] DAMAGECOUNT value on done: 9011.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:36,814][63735] Sum rewards: -1.071, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.923', 'weapon7': '0.006', 'AMMO5': '0.007', 'AMMO2': '0.009', 'WEAPON1': '0.010', 'weapon5': '0.012', 'ARMOR': '0.040', 'AMMO4': '0.047', 'WEAPON4': '0.050', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.124', 'AMMO3': '0.164', 'HITCOUNT': '0.390', 'WEAPON3': '0.850', 'weapon2': '1.228', 'DAMAGECOUNT': '1.650', 'weapon3': '2.114', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:37,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11468.8, 300 sec: 11260.5). Total num frames: 12771328. Throughput: 0: 1517.1, 1: 1352.4. Samples: 3187000. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:37,460][109198] Avg episode reward: [(0, '-2.363'), (1, '-2.944')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:38,033][63734] DAMAGECOUNT value on done: 8833.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:38,390][63734] DAMAGECOUNT value on done: 8459.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:38,391][63734] Sum rewards: -5.022, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.530', 'AMMO4': '-0.043', 'AMMO2': '-0.009', 'AMMO5': '0.013', 'weapon5': '0.034', 'HITCOUNT': '0.150', 'AMMO3': '0.165', 'WEAPON5': '0.250', 'ARMOR': '0.456', 'DAMAGECOUNT': '0.750', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050', 'weapon2': '1.098', 'weapon3': '2.344'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:39,377][63732] Updated weights for policy 0, policy_version 1600 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:40,579][63769] DAMAGECOUNT value on done: 8902.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:40,580][63769] Sum rewards: -3.594, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.836', 'weapon7': '0.002', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'weapon5': '0.064', 'ARMOR': '0.076', 'AMMO4': '0.083', 'HITCOUNT': '0.120', 'AMMO3': '0.165', 'WEAPON5': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON4': '0.250', 'weapon4': '0.412', 'DAMAGECOUNT': '0.519', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.292', 'weapon3': '1.572'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:40,984][63769] DAMAGECOUNT value on done: 8279.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:40,984][63769] Sum rewards: 2.262, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.530', 'weapon5': '0.002', 'AMMO5': '0.005', 'AMMO2': '0.014', 'ARMOR': '0.040', 'AMMO4': '0.067', 'WEAPON5': '0.100', 'AMMO3': '0.131', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.260', 'weapon4': '0.294', 'WEAPON4': '0.300', 'WEAPON3': '0.800', 'weapon2': '1.144', 'DAMAGECOUNT': '1.155', 'weapon3': '1.880', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:41,871][63767] DAMAGECOUNT value on done: 9518.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:41,871][63767] Sum rewards: 0.061, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.670', 'AMMO2': '0.002', 'AMMO5': '0.005', 'AMMO4': '0.009', 'weapon4': '0.014', 'WEAPON1': '0.020', 'weapon5': '0.034', 'ARMOR': '0.036', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'AMMO3': '0.104', 'HITCOUNT': '0.220', 'DAMAGECOUNT': '0.807', 'WEAPON3': '0.850', 'weapon2': '1.314', 'weapon3': '1.916', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:42,286][63767] DAMAGECOUNT value on done: 8335.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:42,287][63767] Sum rewards: -1.838, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.495', 'AMMO2': '0.001', 'AMMO4': '0.007', 'WEAPON1': '0.020', 'ARMOR': '0.020', 'WEAPON4': '0.050', 'HITCOUNT': '0.070', 'AMMO3': '0.105', 'DAMAGECOUNT': '0.180', 'weapon4': '0.180', 'WEAPON3': '0.700', 'weapon2': '0.978', 'weapon3': '1.346', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:42,458][109198] Fps is (10 sec: 11878.3, 60 sec: 11537.1, 300 sec: 11274.4). Total num frames: 12828672. Throughput: 0: 1516.6, 1: 1348.2. Samples: 3204195. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:42,460][109198] Avg episode reward: [(0, '-2.380'), (1, '-2.873')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:42,465][63770] DAMAGECOUNT value on done: 7475.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:42,465][63770] Sum rewards: -1.088, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.935', 'AMMO4': '-0.003', 'AMMO2': '-0.001', 'weapon5': '0.002', 'AMMO5': '0.003', 'WEAPON5': '0.050', 'AMMO3': '0.117', 'WEAPON4': '0.200', 'weapon4': '0.272', 'HITCOUNT': '0.290', 'ARMOR': '0.508', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.035', 'weapon2': '1.126', 'weapon3': '1.698', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:42,857][63770] DAMAGECOUNT value on done: 7900.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:42,857][63770] Sum rewards: -4.657, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.712', 'AMMO2': '0.009', 'WEAPON1': '0.010', 'AMMO5': '0.013', 'weapon5': '0.014', 'ARMOR': '0.036', 'AMMO4': '0.044', 'WEAPON4': '0.100', 'HITCOUNT': '0.140', 'AMMO3': '0.160', 'weapon4': '0.180', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.570', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.114', 'weapon3': '1.966'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:42,867][63735] DAMAGECOUNT value on done: 8409.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:42,868][63735] Sum rewards: -2.975, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.587', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.003', 'AMMO2': '0.003', 'weapon5': '0.006', 'AMMO4': '0.013', 'WEAPON1': '0.020', 'ARMOR': '0.044', 'WEAPON5': '0.050', 'AMMO3': '0.070', 'HITCOUNT': '0.080', 'weapon4': '0.086', 'WEAPON4': '0.100', 'WEAPON3': '0.350', 'DAMAGECOUNT': '0.390', 'weapon3': '1.304', 'weapon2': '1.594'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:43,246][63735] DAMAGECOUNT value on done: 5915.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:43,247][63735] Sum rewards: -9.864, reward structure: {'DEATHCOUNT': '-15.000', 'HEALTH': '-1.596', 'AMMO2': '0.009', 'AMMO4': '0.044', 'ARMOR': '0.108', 'weapon4': '0.126', 'WEAPON4': '0.150', 'AMMO3': '0.176', 'HITCOUNT': '0.200', 'DAMAGECOUNT': '0.477', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.680', 'weapon3': '1.912'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:43,616][63770] Large shaping reward 2.606 for [('FRAGCOUNT', 2.0, 2.0), ('HITCOUNT', 0.05, 5), ('DAMAGECOUNT', 0.555, 185.0), ('AMMO3', -0.001, -2.0), ('weapon3', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:43,678][63806] DAMAGECOUNT value on done: 6771.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:43,678][63806] Sum rewards: -2.079, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.386', 'AMMO5': '0.005', 'AMMO2': '0.009', 'AMMO4': '0.045', 'weapon4': '0.048', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.136', 'weapon5': '0.140', 'HITCOUNT': '0.250', 'DAMAGECOUNT': '0.789', 'WEAPON3': '0.850', 'weapon2': '0.976', 'weapon3': '2.108', 'FRAGCOUNT': '2.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:44,022][63806] DAMAGECOUNT value on done: 9295.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:44,023][63806] Sum rewards: -8.228, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.926', 'AMMO4': '-0.016', 'AMMO2': '-0.003', 'weapon5': '0.006', 'ARMOR': '0.016', 'AMMO5': '0.019', 'WEAPON1': '0.020', 'WEAPON4': '0.100', 'weapon4': '0.104', 'HITCOUNT': '0.150', 'AMMO3': '0.168', 'WEAPON5': '0.200', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.600', 'WEAPON3': '1.000', 'weapon3': '1.368', 'weapon2': '1.466'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:44,123][63733] Updated weights for policy 1, policy_version 1530 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:44,255][63805] DAMAGECOUNT value on done: 10508.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:44,255][63805] Sum rewards: -6.969, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-0.524', 'weapon5': '0.002', 'AMMO2': '0.004', 'AMMO5': '0.012', 'AMMO4': '0.017', 'ARMOR': '0.080', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'AMMO3': '0.168', 'DAMAGECOUNT': '0.780', 'WEAPON3': '1.000', 'weapon2': '1.394', 'FRAGCOUNT': '2.000', 'weapon3': '2.048'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:44,617][63805] DAMAGECOUNT value on done: 7174.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:45,747][63732] Updated weights for policy 0, policy_version 1610 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:46,442][63769] DAMAGECOUNT value on done: 9157.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:46,442][63769] Sum rewards: -0.210, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.489', 'AMMO4': '-0.055', 'AMMO2': '-0.011', 'AMMO3': '0.083', 'HITCOUNT': '0.090', 'ARMOR': '0.432', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.450', 'FRAGCOUNT': '1.000', 'weapon2': '1.478', 'weapon3': '1.626'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:46,838][63769] DAMAGECOUNT value on done: 7169.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:46,839][63769] Sum rewards: -5.983, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.626', 'AMMO4': '-0.033', 'AMMO2': '-0.007', 'WEAPON4': '0.100', 'AMMO3': '0.149', 'weapon4': '0.174', 'HITCOUNT': '0.180', 'ARMOR': '0.471', 'DAMAGECOUNT': '0.705', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon3': '1.254', 'weapon2': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:47,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11400.5, 300 sec: 11274.4). Total num frames: 12881920. Throughput: 0: 1524.4, 1: 1335.6. Samples: 3212737. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:47,460][109198] Avg episode reward: [(0, '-2.395'), (1, '-3.051')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:47,896][63771] DAMAGECOUNT value on done: 6124.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:47,897][63771] Sum rewards: -7.017, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-3.605', 'FRAGCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.013', 'AMMO4': '0.022', 'ARMOR': '0.056', 'weapon5': '0.100', 'AMMO3': '0.149', 'HITCOUNT': '0.180', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'weapon4': '0.270', 'DAMAGECOUNT': '0.900', 'WEAPON3': '1.050', 'weapon2': '1.296', 'weapon3': '1.848'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:48,294][63771] DAMAGECOUNT value on done: 8627.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:48,294][63771] Sum rewards: -3.730, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.080', 'AMMO2': '0.007', 'AMMO5': '0.007', 'AMMO4': '0.035', 'weapon5': '0.078', 'AMMO3': '0.153', 'WEAPON5': '0.200', 'HITCOUNT': '0.250', 'WEAPON4': '0.250', 'weapon4': '0.480', 'ARMOR': '0.511', 'WEAPON3': '0.950', 'DAMAGECOUNT': '0.954', 'weapon2': '1.166', 'weapon3': '1.558', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:51,041][63767] DAMAGECOUNT value on done: 9871.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:51,041][63767] Sum rewards: -2.278, reward structure: {'DEATHCOUNT': '-5.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.722', 'AMMO2': '0.008', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'ARMOR': '0.029', 'AMMO4': '0.040', 'HITCOUNT': '0.050', 'AMMO3': '0.062', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.150', 'weapon7': '0.152', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.258', 'WEAPON5': '0.300', 'weapon4': '0.326', 'weapon5': '0.366', 'WEAPON3': '0.400', 'weapon3': '1.044', 'weapon2': '1.532'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:51,441][63767] DAMAGECOUNT value on done: 11240.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:51,441][63767] Sum rewards: 0.925, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.484', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'AMMO5': '0.017', 'weapon4': '0.034', 'AMMO4': '0.082', 'WEAPON4': '0.100', 'AMMO3': '0.103', 'HITCOUNT': '0.120', 'weapon5': '0.202', 'DAMAGECOUNT': '0.300', 'WEAPON5': '0.350', 'ARMOR': '0.412', 'WEAPON3': '0.550', 'weapon2': '1.210', 'weapon3': '1.652', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:51,859][63732] Updated weights for policy 0, policy_version 1620 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:52,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11468.8, 300 sec: 11302.2). Total num frames: 12943360. Throughput: 0: 1547.2, 1: 1310.9. Samples: 3229880. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:52,460][109198] Avg episode reward: [(0, '-2.396'), (1, '-3.051')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:52,822][63733] Updated weights for policy 1, policy_version 1540 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:53,862][63805] DAMAGECOUNT value on done: 9898.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:53,862][63805] Sum rewards: -1.889, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.868', 'AMMO5': '0.012', 'AMMO2': '0.033', 'weapon7': '0.068', 'weapon5': '0.082', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.141', 'HITCOUNT': '0.150', 'AMMO4': '0.162', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.264', 'WEAPON3': '0.800', 'weapon2': '1.158', 'DAMAGECOUNT': '1.224', 'weapon3': '1.434', 'FRAGCOUNT': '2.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:54,261][63805] DAMAGECOUNT value on done: 9931.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:54,262][63805] Sum rewards: -3.161, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.536', 'AMMO5': '0.017', 'AMMO2': '0.037', 'ARMOR': '0.044', 'HITCOUNT': '0.090', 'weapon5': '0.104', 'AMMO3': '0.135', 'AMMO4': '0.183', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.282', 'weapon4': '0.386', 'WEAPON4': '0.400', 'WEAPON3': '0.900', 'weapon2': '1.130', 'weapon3': '1.918', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:56,322][63770] DAMAGECOUNT value on done: 10010.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:56,322][63770] Sum rewards: -0.143, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.868', 'AMMO2': '0.010', 'AMMO5': '0.011', 'WEAPON4': '0.050', 'AMMO4': '0.051', 'weapon5': '0.134', 'AMMO3': '0.173', 'WEAPON5': '0.250', 'ARMOR': '0.400', 'HITCOUNT': '0.400', 'WEAPON3': '1.000', 'weapon2': '1.276', 'DAMAGECOUNT': '1.461', 'weapon3': '2.258', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:56,712][63770] DAMAGECOUNT value on done: 7233.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:56,712][63770] Sum rewards: -0.470, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.680', 'AMMO5': '0.003', 'AMMO2': '0.008', 'AMMO4': '0.039', 'WEAPON5': '0.050', 'weapon4': '0.082', 'WEAPON4': '0.150', 'AMMO3': '0.178', 'HITCOUNT': '0.220', 'ARMOR': '0.440', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.200', 'weapon3': '1.614', 'weapon2': '1.826', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:56,764][63806] DAMAGECOUNT value on done: 9163.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:56,785][63771] DAMAGECOUNT value on done: 9885.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:56,785][63771] Sum rewards: -4.456, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.530', 'AMMO4': '-0.030', 'AMMO2': '-0.006', 'AMMO5': '0.005', 'weapon5': '0.006', 'ARMOR': '0.024', 'WEAPON5': '0.100', 'AMMO3': '0.142', 'HITCOUNT': '0.230', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.900', 'weapon2': '1.302', 'FRAGCOUNT': '2.000', 'weapon3': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:57,162][63806] DAMAGECOUNT value on done: 8321.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:57,162][63806] Sum rewards: 1.196, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.089', 'AMMO2': '0.024', 'AMMO5': '0.030', 'WEAPON4': '0.100', 'AMMO3': '0.114', 'AMMO4': '0.118', 'HITCOUNT': '0.220', 'weapon5': '0.320', 'WEAPON5': '0.450', 'weapon4': '0.452', 'WEAPON3': '0.500', 'ARMOR': '0.557', 'DAMAGECOUNT': '0.702', 'weapon3': '1.348', 'weapon2': '1.350', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:57,173][63771] DAMAGECOUNT value on done: 7043.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:57,173][63771] Sum rewards: -5.124, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.028', 'AMMO4': '-0.016', 'AMMO2': '-0.003', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'WEAPON4': '0.050', 'AMMO3': '0.177', 'HITCOUNT': '0.240', 'WEAPON3': '1.000', 'DAMAGECOUNT': '1.140', 'weapon3': '1.722', 'weapon2': '1.800', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:57,458][109198] Fps is (10 sec: 11878.5, 60 sec: 11468.8, 300 sec: 11302.2). Total num frames: 13000704. Throughput: 0: 1568.9, 1: 1290.4. Samples: 3247253. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:55:57,460][109198] Avg episode reward: [(0, '-2.322'), (1, '-3.109')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:57,912][63732] Updated weights for policy 0, policy_version 1630 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:59,508][63735] DAMAGECOUNT value on done: 8686.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:59,508][63735] Sum rewards: -7.301, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.770', 'AMMO4': '-0.019', 'AMMO2': '-0.004', 'AMMO5': '0.025', 'weapon5': '0.052', 'AMMO3': '0.189', 'WEAPON5': '0.300', 'HITCOUNT': '0.320', 'DAMAGECOUNT': '0.996', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.790', 'weapon2': '1.820'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:59,822][63735] DAMAGECOUNT value on done: 9591.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:55:59,822][63735] Sum rewards: -2.823, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.159', 'AMMO4': '-0.003', 'AMMO2': '-0.000', 'AMMO5': '0.015', 'weapon5': '0.100', 'weapon4': '0.106', 'WEAPON4': '0.150', 'AMMO3': '0.180', 'WEAPON5': '0.300', 'HITCOUNT': '0.430', 'WEAPON3': '1.100', 'weapon2': '1.420', 'DAMAGECOUNT': '1.740', 'weapon3': '2.048', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:00,774][63733] Updated weights for policy 1, policy_version 1550 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:01,809][63734] DAMAGECOUNT value on done: 9358.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:01,810][63734] Sum rewards: 2.006, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.336', 'AMMO5': '0.019', 'AMMO2': '0.019', 'AMMO4': '0.096', 'ARMOR': '0.108', 'AMMO3': '0.143', 'WEAPON4': '0.150', 'weapon5': '0.150', 'HITCOUNT': '0.270', 'WEAPON5': '0.300', 'weapon4': '0.356', 'WEAPON3': '0.750', 'weapon2': '1.274', 'DAMAGECOUNT': '1.575', 'weapon3': '1.632', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:01,862][63734] DAMAGECOUNT value on done: 8306.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:01,862][63734] Sum rewards: -3.814, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.698', 'AMMO2': '0.003', 'AMMO5': '0.007', 'AMMO4': '0.015', 'WEAPON4': '0.050', 'weapon4': '0.096', 'AMMO3': '0.115', 'WEAPON5': '0.150', 'weapon5': '0.182', 'HITCOUNT': '0.210', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.645', 'WEAPON3': '0.750', 'ARMOR': '0.900', 'weapon2': '1.346', 'weapon3': '1.914'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:02,218][63734] DAMAGECOUNT value on done: 8633.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:02,218][63734] Sum rewards: -2.582, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.335', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'weapon5': '0.026', 'AMMO2': '0.033', 'ARMOR': '0.063', 'AMMO4': '0.163', 'HITCOUNT': '0.170', 'AMMO3': '0.173', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon4': '0.322', 'DAMAGECOUNT': '0.522', 'weapon2': '0.840', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon3': '2.212'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:02,314][63734] DAMAGECOUNT value on done: 6403.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:02,315][63734] Sum rewards: -4.927, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.896', 'AMMO2': '0.001', 'AMMO4': '0.007', 'WEAPON1': '0.020', 'weapon4': '0.034', 'ARMOR': '0.048', 'WEAPON4': '0.100', 'HITCOUNT': '0.120', 'AMMO3': '0.131', 'DAMAGECOUNT': '0.372', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.646', 'weapon2': '1.690'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:02,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11468.8, 300 sec: 11316.1). Total num frames: 13058048. Throughput: 0: 1568.6, 1: 1293.1. Samples: 3255948. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:02,460][109198] Avg episode reward: [(0, '-2.345'), (1, '-3.097')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:03,989][63769] DAMAGECOUNT value on done: 9087.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:03,990][63769] Sum rewards: -3.758, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.851', 'AMMO2': '0.017', 'AMMO5': '0.028', 'WEAPON4': '0.050', 'weapon5': '0.056', 'AMMO4': '0.085', 'ARMOR': '0.144', 'AMMO3': '0.161', 'HITCOUNT': '0.180', 'weapon4': '0.180', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.555', 'WEAPON3': '1.050', 'weapon2': '1.092', 'FRAGCOUNT': '2.000', 'weapon3': '2.046'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:04,382][63769] DAMAGECOUNT value on done: 8523.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:04,383][63769] Sum rewards: -1.934, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.552', 'AMMO5': '0.013', 'AMMO2': '0.015', 'weapon5': '0.072', 'AMMO4': '0.072', 'AMMO3': '0.133', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'HITCOUNT': '0.260', 'weapon4': '0.464', 'ARMOR': '0.476', 'DAMAGECOUNT': '0.732', 'weapon2': '0.786', 'WEAPON3': '0.850', 'weapon3': '1.646', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:04,814][63767] DAMAGECOUNT value on done: 9782.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:04,814][63767] Sum rewards: -4.030, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.307', 'AMMO5': '0.003', 'AMMO2': '0.025', 'weapon5': '0.036', 'WEAPON5': '0.050', 'AMMO3': '0.114', 'AMMO4': '0.124', 'ARMOR': '0.144', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'weapon4': '0.414', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.792', 'WEAPON3': '0.800', 'weapon2': '1.162', 'weapon3': '1.694'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:04,890][63732] Updated weights for policy 0, policy_version 1640 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:05,180][63735] DAMAGECOUNT value on done: 8638.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:05,180][63735] Sum rewards: -2.481, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.418', 'AMMO2': '0.002', 'weapon5': '0.006', 'AMMO5': '0.010', 'AMMO4': '0.010', 'WEAPON4': '0.050', 'ARMOR': '0.072', 'WEAPON5': '0.100', 'weapon4': '0.100', 'AMMO3': '0.129', 'HITCOUNT': '0.200', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.687', 'FRAGCOUNT': '1.000', 'weapon3': '1.476', 'weapon2': '1.944'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:05,185][63767] DAMAGECOUNT value on done: 8723.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:05,186][63767] Sum rewards: 0.636, reward structure: {'DEATHCOUNT': '-9.750', 'AMMO5': '0.012', 'weapon4': '0.016', 'AMMO2': '0.017', 'WEAPON4': '0.050', 'AMMO4': '0.085', 'HEALTH': '0.113', 'AMMO3': '0.128', 'weapon5': '0.188', 'WEAPON5': '0.200', 'HITCOUNT': '0.280', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.164', 'weapon3': '1.610', 'weapon2': '1.872', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:05,528][63735] DAMAGECOUNT value on done: 6250.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:05,528][63735] Sum rewards: -3.283, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.854', 'AMMO2': '0.001', 'AMMO4': '0.004', 'AMMO5': '0.005', 'weapon5': '0.018', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.128', 'weapon4': '0.130', 'HITCOUNT': '0.290', 'ARMOR': '0.442', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.005', 'weapon2': '1.236', 'weapon3': '1.962', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:05,632][63806] DAMAGECOUNT value on done: 7081.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:05,633][63806] Sum rewards: 0.525, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO5': '0.005', 'weapon5': '0.006', 'WEAPON1': '0.010', 'AMMO2': '0.023', 'WEAPON5': '0.050', 'weapon7': '0.074', 'AMMO3': '0.095', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO4': '0.115', 'WEAPON4': '0.150', 'HITCOUNT': '0.220', 'HEALTH': '0.368', 'weapon4': '0.394', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.930', 'weapon3': '1.174', 'weapon2': '1.360', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:06,021][63806] DAMAGECOUNT value on done: 9355.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:06,713][63805] DAMAGECOUNT value on done: 10643.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:06,714][63805] Sum rewards: -5.581, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.850', 'ARMOR': '0.004', 'AMMO2': '0.007', 'AMMO5': '0.007', 'AMMO4': '0.034', 'WEAPON5': '0.050', 'HITCOUNT': '0.080', 'weapon4': '0.114', 'AMMO3': '0.136', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.342', 'weapon3': '1.790'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:07,034][63805] DAMAGECOUNT value on done: 7266.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:07,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11468.8, 300 sec: 11330.0). Total num frames: 13115392. Throughput: 0: 1562.0, 1: 1311.7. Samples: 3273368. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:07,460][109198] Avg episode reward: [(0, '-2.290'), (1, '-3.180')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:07,840][63733] Updated weights for policy 1, policy_version 1560 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:07,942][63770] DAMAGECOUNT value on done: 7683.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:07,942][63770] Sum rewards: 2.704, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-0.885', 'AMMO2': '0.004', 'AMMO5': '0.007', 'AMMO4': '0.018', 'WEAPON1': '0.020', 'weapon7': '0.054', 'ARMOR': '0.072', 'AMMO3': '0.084', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'HITCOUNT': '0.180', 'WEAPON5': '0.200', 'weapon5': '0.306', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.624', 'weapon3': '0.912', 'weapon2': '1.358', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:08,289][63770] DAMAGECOUNT value on done: 8010.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:08,290][63770] Sum rewards: -2.474, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.294', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO4': '0.047', 'weapon5': '0.054', 'AMMO3': '0.062', 'HITCOUNT': '0.080', 'WEAPON5': '0.100', 'ARMOR': '0.108', 'WEAPON4': '0.200', 'weapon4': '0.240', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.450', 'weapon3': '0.826', 'weapon2': '1.808', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:09,413][63769] DAMAGECOUNT value on done: 9447.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:09,414][63769] Sum rewards: 0.571, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.700', 'AMMO2': '0.001', 'AMMO5': '0.005', 'weapon5': '0.006', 'AMMO4': '0.006', 'ARMOR': '0.052', 'WEAPON5': '0.100', 'AMMO3': '0.120', 'HITCOUNT': '0.200', 'WEAPON4': '0.300', 'weapon4': '0.396', 'DAMAGECOUNT': '0.870', 'WEAPON3': '0.900', 'weapon2': '1.050', 'weapon3': '2.014', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:09,752][63769] DAMAGECOUNT value on done: 7214.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:11,266][63771] DAMAGECOUNT value on done: 6563.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:11,267][63771] Sum rewards: -1.060, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-0.638', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'ARMOR': '0.020', 'weapon7': '0.026', 'AMMO2': '0.036', 'AMMO3': '0.103', 'weapon5': '0.126', 'WEAPON5': '0.150', 'AMMO4': '0.180', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON4': '0.250', 'weapon4': '0.298', 'HITCOUNT': '0.300', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.317', 'weapon2': '1.584', 'weapon3': '1.660', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:11,594][63771] DAMAGECOUNT value on done: 9090.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:11,594][63771] Sum rewards: 2.349, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.424', 'AMMO5': '0.003', 'AMMO2': '0.012', 'weapon5': '0.026', 'WEAPON5': '0.050', 'AMMO4': '0.061', 'AMMO3': '0.097', 'WEAPON4': '0.150', 'weapon4': '0.336', 'HITCOUNT': '0.430', 'WEAPON3': '0.500', 'ARMOR': '0.505', 'weapon2': '1.210', 'DAMAGECOUNT': '1.389', 'weapon3': '1.504', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:11,988][63732] Updated weights for policy 0, policy_version 1650 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:12,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11468.8, 300 sec: 11330.0). Total num frames: 13172736. Throughput: 0: 1553.3, 1: 1326.6. Samples: 3290675. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:12,460][109198] Avg episode reward: [(0, '-2.179'), (1, '-3.175')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:13,520][63767] DAMAGECOUNT value on done: 10394.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:13,520][63767] Sum rewards: -6.370, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.306', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.012', 'weapon5': '0.048', 'WEAPON4': '0.100', 'weapon4': '0.124', 'WEAPON5': '0.150', 'AMMO3': '0.176', 'HITCOUNT': '0.310', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.548', 'weapon3': '1.778', 'weapon2': '1.786'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:13,840][63767] DAMAGECOUNT value on done: 11870.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:13,840][63767] Sum rewards: 0.744, reward structure: {'DEATHCOUNT': '-11.250', 'ARMOR': '0.008', 'AMMO5': '0.012', 'AMMO2': '0.042', 'AMMO3': '0.148', 'weapon4': '0.162', 'WEAPON5': '0.200', 'AMMO4': '0.211', 'WEAPON4': '0.350', 'weapon5': '0.360', 'HEALTH': '0.430', 'HITCOUNT': '0.430', 'WEAPON3': '0.750', 'weapon2': '0.866', 'DAMAGECOUNT': '1.890', 'weapon3': '2.134', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:14,526][63769] Large shaping reward -2.549 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.3, -100.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:14,875][63733] Updated weights for policy 1, policy_version 1570 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:16,787][63805] DAMAGECOUNT value on done: 10098.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:17,182][63805] DAMAGECOUNT value on done: 10311.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:17,182][63805] Sum rewards: 0.792, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.152', 'AMMO5': '0.005', 'AMMO2': '0.024', 'weapon7': '0.044', 'ARMOR': '0.045', 'WEAPON5': '0.100', 'AMMO3': '0.103', 'AMMO4': '0.121', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon5': '0.234', 'HITCOUNT': '0.330', 'WEAPON4': '0.400', 'WEAPON3': '0.500', 'weapon4': '0.714', 'weapon3': '1.092', 'DAMAGECOUNT': '1.140', 'weapon2': '1.492', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:17,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11468.8, 300 sec: 11343.8). Total num frames: 13230080. Throughput: 0: 1549.2, 1: 1333.5. Samples: 3299405. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:17,460][109198] Avg episode reward: [(0, '-2.168'), (1, '-3.175')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:18,901][63806] DAMAGECOUNT value on done: 9313.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:18,901][63806] Sum rewards: -5.330, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.706', 'AMMO5': '0.008', 'AMMO2': '0.012', 'AMMO4': '0.058', 'weapon5': '0.070', 'ARMOR': '0.090', 'WEAPON4': '0.100', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'AMMO3': '0.163', 'weapon4': '0.166', 'DAMAGECOUNT': '0.450', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.750', 'weapon3': '1.598', 'weapon2': '1.612'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:19,340][63806] DAMAGECOUNT value on done: 8578.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:19,341][63806] Sum rewards: -2.428, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.494', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'AMMO2': '0.022', 'WEAPON4': '0.050', 'ARMOR': '0.052', 'WEAPON5': '0.100', 'AMMO4': '0.112', 'AMMO3': '0.128', 'HITCOUNT': '0.230', 'DAMAGECOUNT': '0.771', 'WEAPON3': '0.800', 'weapon2': '1.568', 'weapon3': '1.958', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:19,375][63732] Updated weights for policy 0, policy_version 1660 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:20,132][63771] DAMAGECOUNT value on done: 9962.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:20,133][63771] Sum rewards: -5.833, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.433', 'AMMO2': '0.007', 'AMMO4': '0.035', 'HITCOUNT': '0.080', 'AMMO3': '0.120', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.231', 'weapon4': '0.254', 'ARMOR': '0.488', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.460', 'weapon2': '1.574'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:20,472][63771] DAMAGECOUNT value on done: 7198.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:20,473][63771] Sum rewards: -3.231, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.003', 'weapon4': '0.012', 'WEAPON1': '0.020', 'AMMO2': '0.020', 'HEALTH': '0.046', 'WEAPON5': '0.050', 'ARMOR': '0.060', 'AMMO4': '0.101', 'AMMO3': '0.104', 'weapon5': '0.124', 'HITCOUNT': '0.140', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.600', 'weapon2': '1.456', 'weapon3': '1.668'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:20,551][63771] Large shaping reward 2.642 for [('FRAGCOUNT', 2.0, 2.0), ('HITCOUNT', 0.04, 4.0), ('DAMAGECOUNT', 0.6, 200), ('weapon7', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:22,210][63770] DAMAGECOUNT value on done: 10529.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:22,210][63770] Sum rewards: 1.222, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.704', 'AMMO2': '0.008', 'AMMO5': '0.017', 'AMMO4': '0.039', 'weapon7': '0.046', 'weapon4': '0.060', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.153', 'HITCOUNT': '0.220', 'WEAPON5': '0.300', 'weapon5': '0.430', 'ARMOR': '0.496', 'WEAPON3': '0.750', 'weapon3': '1.172', 'weapon2': '1.528', 'DAMAGECOUNT': '1.557', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:22,458][109198] Fps is (10 sec: 10649.6, 60 sec: 11400.6, 300 sec: 11316.1). Total num frames: 13279232. Throughput: 0: 1519.9, 1: 1332.6. Samples: 3315362. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:22,459][109198] Avg episode reward: [(0, '-2.145'), (1, '-3.175')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:22,470][63733] Updated weights for policy 1, policy_version 1580 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:22,708][63770] DAMAGECOUNT value on done: 7407.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:22,709][63770] Sum rewards: -1.564, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.738', 'AMMO5': '0.003', 'AMMO2': '0.020', 'WEAPON1': '0.030', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'AMMO4': '0.100', 'AMMO3': '0.107', 'HITCOUNT': '0.180', 'WEAPON4': '0.250', 'weapon4': '0.304', 'DAMAGECOUNT': '0.522', 'WEAPON3': '0.700', 'weapon2': '1.320', 'weapon3': '1.798', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:25,872][63735] DAMAGECOUNT value on done: 8826.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:25,872][63735] Sum rewards: 1.067, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.506', 'AMMO5': '0.005', 'AMMO2': '0.009', 'ARMOR': '0.032', 'AMMO4': '0.042', 'weapon5': '0.076', 'AMMO3': '0.089', 'WEAPON5': '0.100', 'HITCOUNT': '0.130', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.550', 'weapon2': '1.226', 'weapon3': '1.394', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:26,240][63735] DAMAGECOUNT value on done: 10096.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:26,240][63735] Sum rewards: 1.351, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.830', 'AMMO2': '0.015', 'AMMO5': '0.028', 'AMMO4': '0.073', 'WEAPON4': '0.100', 'AMMO3': '0.142', 'weapon5': '0.262', 'weapon4': '0.264', 'WEAPON5': '0.300', 'HITCOUNT': '0.400', 'WEAPON3': '0.900', 'weapon2': '1.326', 'DAMAGECOUNT': '1.515', 'weapon3': '1.856', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:26,416][63734] DAMAGECOUNT value on done: 9493.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:26,417][63734] Sum rewards: -3.791, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.870', 'FRAGCOUNT': '-1.500', 'AMMO4': '-0.041', 'AMMO2': '-0.008', 'AMMO5': '0.018', 'ARMOR': '0.056', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.104', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.127', 'weapon5': '0.130', 'weapon7': '0.198', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.800', 'weapon3': '1.118', 'weapon2': '1.932'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:26,787][63734] DAMAGECOUNT value on done: 9063.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:26,787][63734] Sum rewards: -0.942, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.514', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.012', 'AMMO4': '0.057', 'weapon4': '0.124', 'ARMOR': '0.141', 'weapon5': '0.144', 'WEAPON4': '0.150', 'AMMO3': '0.177', 'WEAPON5': '0.200', 'HITCOUNT': '0.290', 'WEAPON3': '1.050', 'weapon2': '1.282', 'DAMAGECOUNT': '1.290', 'weapon3': '2.138', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:27,458][109198] Fps is (10 sec: 10240.0, 60 sec: 11264.0, 300 sec: 11316.1). Total num frames: 13332480. Throughput: 0: 1477.4, 1: 1327.1. Samples: 3330401. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:27,460][109198] Avg episode reward: [(0, '-2.143'), (1, '-3.235')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:27,467][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001586_6496256.pth...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:27,467][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001669_6836224.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:27,523][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001274_5218304.pth\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:27,526][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001314_5382144.pth\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:27,891][63732] Updated weights for policy 0, policy_version 1670 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:28,114][63734] DAMAGECOUNT value on done: 8757.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:28,114][63734] Sum rewards: -0.023, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.475', 'AMMO2': '0.008', 'AMMO5': '0.015', 'AMMO4': '0.041', 'WEAPON4': '0.050', 'weapon5': '0.126', 'AMMO3': '0.147', 'weapon4': '0.194', 'WEAPON5': '0.250', 'HITCOUNT': '0.390', 'ARMOR': '0.416', 'WEAPON3': '0.900', 'weapon2': '0.966', 'DAMAGECOUNT': '1.353', 'weapon3': '2.346', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:28,308][63806] DAMAGECOUNT value on done: 7348.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:28,483][63734] DAMAGECOUNT value on done: 6742.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:28,484][63734] Sum rewards: -4.219, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.343', 'AMMO4': '-0.022', 'AMMO2': '-0.004', 'weapon5': '0.002', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'ARMOR': '0.044', 'weapon4': '0.058', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.170', 'HITCOUNT': '0.200', 'DAMAGECOUNT': '1.017', 'weapon2': '1.142', 'WEAPON3': '1.150', 'weapon3': '2.402', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:28,747][63806] DAMAGECOUNT value on done: 9434.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:28,785][63767] DAMAGECOUNT value on done: 9977.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:28,973][63769] DAMAGECOUNT value on done: 9342.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:28,973][63769] Sum rewards: -1.064, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.261', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.028', 'WEAPON4': '0.050', 'AMMO3': '0.114', 'weapon4': '0.134', 'AMMO4': '0.138', 'WEAPON5': '0.200', 'weapon5': '0.246', 'HITCOUNT': '0.260', 'ARMOR': '0.440', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.765', 'FRAGCOUNT': '1.000', 'weapon3': '1.576', 'weapon2': '1.826'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:29,150][63767] DAMAGECOUNT value on done: 9339.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:29,151][63767] Sum rewards: 2.088, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.200', 'AMMO5': '0.005', 'AMMO2': '0.007', 'AMMO4': '0.033', 'weapon5': '0.098', 'WEAPON5': '0.100', 'AMMO3': '0.101', 'weapon4': '0.174', 'WEAPON4': '0.200', 'ARMOR': '0.400', 'HITCOUNT': '0.420', 'WEAPON3': '0.700', 'weapon2': '1.284', 'weapon3': '1.668', 'DAMAGECOUNT': '1.848', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:29,338][63769] DAMAGECOUNT value on done: 8872.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:29,339][63769] Sum rewards: -4.811, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.128', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.002', 'AMMO2': '-0.000', 'AMMO5': '0.014', 'ARMOR': '0.068', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.150', 'AMMO3': '0.156', 'weapon5': '0.156', 'weapon4': '0.268', 'WEAPON5': '0.300', 'HITCOUNT': '0.310', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.047', 'weapon2': '1.364', 'weapon3': '1.786'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:29,611][63735] DAMAGECOUNT value on done: 8938.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:29,611][63735] Sum rewards: -1.449, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.660', 'AMMO2': '0.033', 'ARMOR': '0.072', 'AMMO3': '0.115', 'AMMO4': '0.167', 'WEAPON4': '0.200', 'HITCOUNT': '0.240', 'weapon4': '0.338', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.900', 'weapon3': '0.978', 'FRAGCOUNT': '1.000', 'weapon2': '2.168'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:29,929][63735] DAMAGECOUNT value on done: 6575.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:29,929][63735] Sum rewards: -2.709, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.534', 'AMMO2': '0.005', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.027', 'weapon5': '0.028', 'AMMO3': '0.121', 'WEAPON5': '0.250', 'HITCOUNT': '0.260', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.975', 'weapon3': '1.742', 'weapon2': '1.744', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:30,202][63733] Updated weights for policy 1, policy_version 1590 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:30,729][63805] DAMAGECOUNT value on done: 10768.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:30,729][63805] Sum rewards: 1.332, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.760', 'AMMO2': '0.008', 'AMMO5': '0.012', 'weapon5': '0.016', 'WEAPON1': '0.030', 'ARMOR': '0.040', 'AMMO4': '0.041', 'WEAPON4': '0.050', 'AMMO3': '0.071', 'HITCOUNT': '0.120', 'weapon4': '0.134', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.500', 'weapon3': '1.350', 'weapon2': '1.694', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:31,136][63805] DAMAGECOUNT value on done: 7641.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:31,136][63805] Sum rewards: -3.823, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.862', 'AMMO2': '0.007', 'AMMO5': '0.012', 'ARMOR': '0.024', 'AMMO4': '0.037', 'AMMO3': '0.127', 'weapon5': '0.128', 'HITCOUNT': '0.190', 'WEAPON5': '0.250', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.125', 'weapon2': '1.500', 'weapon3': '1.688'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:32,458][109198] Fps is (10 sec: 10649.5, 60 sec: 11264.0, 300 sec: 11302.2). Total num frames: 13385728. Throughput: 0: 1457.7, 1: 1337.4. Samples: 3338515. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:32,460][109198] Avg episode reward: [(0, '-2.151'), (1, '-3.309')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:33,293][63769] DAMAGECOUNT value on done: 9467.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:33,673][63769] DAMAGECOUNT value on done: 7368.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:34,495][63770] DAMAGECOUNT value on done: 8109.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:34,496][63770] Sum rewards: 0.245, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.984', 'AMMO2': '0.019', 'weapon4': '0.040', 'ARMOR': '0.068', 'AMMO4': '0.094', 'WEAPON4': '0.100', 'AMMO3': '0.154', 'HITCOUNT': '0.340', 'WEAPON3': '0.950', 'DAMAGECOUNT': '1.278', 'weapon2': '1.422', 'weapon3': '2.264', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:34,683][63732] Updated weights for policy 0, policy_version 1680 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:34,952][63770] DAMAGECOUNT value on done: 8090.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:34,953][63770] Sum rewards: -5.176, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.909', 'AMMO2': '0.008', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'AMMO4': '0.039', 'weapon4': '0.062', 'weapon5': '0.068', 'HITCOUNT': '0.080', 'ARMOR': '0.080', 'WEAPON4': '0.100', 'AMMO3': '0.161', 'DAMAGECOUNT': '0.240', 'WEAPON5': '0.250', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.490', 'weapon3': '1.872'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:36,222][63771] DAMAGECOUNT value on done: 7027.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:36,223][63771] Sum rewards: -1.728, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.405', 'AMMO4': '-0.074', 'AMMO2': '-0.015', 'AMMO5': '0.006', 'WEAPON4': '0.100', 'AMMO3': '0.121', 'weapon5': '0.142', 'WEAPON5': '0.150', 'weapon4': '0.196', 'HITCOUNT': '0.330', 'ARMOR': '0.489', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.950', 'weapon2': '1.246', 'DAMAGECOUNT': '1.392', 'weapon3': '1.894'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:36,558][63771] DAMAGECOUNT value on done: 9774.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:36,559][63771] Sum rewards: 4.506, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.812', 'AMMO2': '0.001', 'AMMO4': '0.002', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'ARMOR': '0.036', 'weapon7': '0.062', 'AMMO3': '0.096', 'WEAPON5': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON7': '0.200', 'HITCOUNT': '0.310', 'WEAPON3': '0.550', 'weapon2': '1.462', 'weapon3': '1.604', 'DAMAGECOUNT': '1.890', 'FRAGCOUNT': '7.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:37,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11264.0, 300 sec: 11330.0). Total num frames: 13447168. Throughput: 0: 1438.7, 1: 1355.6. Samples: 3355622. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:37,460][109198] Avg episode reward: [(0, '-2.096'), (1, '-3.311')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:37,471][63454] Saving new best policy, reward=-2.096!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:37,927][63767] DAMAGECOUNT value on done: 10782.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:37,927][63767] Sum rewards: 0.319, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.932', 'AMMO2': '0.004', 'AMMO5': '0.009', 'AMMO4': '0.018', 'WEAPON1': '0.020', 'weapon7': '0.048', 'WEAPON4': '0.050', 'AMMO3': '0.072', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon4': '0.158', 'WEAPON7': '0.200', 'WEAPON5': '0.250', 'HITCOUNT': '0.260', 'weapon5': '0.310', 'ARMOR': '0.479', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.164', 'weapon2': '1.204', 'weapon3': '1.214'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:38,087][63733] Updated weights for policy 1, policy_version 1600 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:38,267][63767] DAMAGECOUNT value on done: 12272.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:38,267][63767] Sum rewards: -2.446, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.778', 'AMMO2': '0.015', 'AMMO5': '0.020', 'ARMOR': '0.040', 'AMMO4': '0.074', 'WEAPON4': '0.100', 'weapon5': '0.114', 'AMMO3': '0.123', 'weapon4': '0.204', 'HITCOUNT': '0.260', 'WEAPON5': '0.350', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.206', 'weapon2': '1.358', 'weapon3': '1.618', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:41,061][63732] Updated weights for policy 0, policy_version 1690 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:41,760][63806] DAMAGECOUNT value on done: 9433.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:41,761][63806] Sum rewards: -4.980, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.854', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.022', 'AMMO2': '-0.004', 'AMMO5': '0.005', 'ARMOR': '0.036', 'HITCOUNT': '0.070', 'weapon5': '0.076', 'WEAPON5': '0.100', 'AMMO3': '0.157', 'DAMAGECOUNT': '0.360', 'WEAPON3': '0.750', 'weapon2': '1.410', 'weapon3': '1.936'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:41,779][63805] DAMAGECOUNT value on done: 10217.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:41,779][63805] Sum rewards: 0.853, reward structure: {'DEATHCOUNT': '-5.250', 'WEAPON1': '0.010', 'AMMO5': '0.017', 'AMMO2': '0.027', 'AMMO3': '0.092', 'HITCOUNT': '0.130', 'AMMO4': '0.135', 'WEAPON5': '0.300', 'weapon5': '0.308', 'DAMAGECOUNT': '0.357', 'WEAPON3': '0.400', 'HEALTH': '0.498', 'FRAGCOUNT': '1.000', 'weapon2': '1.190', 'weapon3': '1.638'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:42,071][63806] DAMAGECOUNT value on done: 8699.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:42,120][63805] DAMAGECOUNT value on done: 10478.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:42,120][63805] Sum rewards: -8.578, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.058', 'AMMO2': '0.007', 'ARMOR': '0.016', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'AMMO4': '0.034', 'weapon4': '0.078', 'AMMO3': '0.115', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'WEAPON5': '0.300', 'weapon5': '0.434', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.501', 'WEAPON3': '0.700', 'weapon3': '1.222', 'weapon2': '1.986'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:42,458][109198] Fps is (10 sec: 11878.4, 60 sec: 11264.0, 300 sec: 11330.0). Total num frames: 13504512. Throughput: 0: 1428.2, 1: 1361.6. Samples: 3372793. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:42,460][109198] Avg episode reward: [(0, '-2.017'), (1, '-3.421')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:42,462][63454] Saving new best policy, reward=-2.017!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:43,540][63771] DAMAGECOUNT value on done: 10180.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:43,540][63771] Sum rewards: -4.373, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.157', 'AMMO4': '-0.046', 'AMMO2': '-0.009', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'ARMOR': '0.020', 'weapon5': '0.072', 'AMMO3': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.210', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.654', 'FRAGCOUNT': '1.000', 'weapon3': '1.548', 'weapon2': '1.820'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:43,926][63771] DAMAGECOUNT value on done: 7333.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:43,927][63771] Sum rewards: -3.539, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.300', 'AMMO2': '0.017', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'HITCOUNT': '0.080', 'AMMO4': '0.086', 'AMMO3': '0.106', 'WEAPON4': '0.150', 'weapon4': '0.268', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.268', 'weapon2': '1.974'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:46,190][63733] Updated weights for policy 1, policy_version 1610 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:47,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11264.0, 300 sec: 11330.0). Total num frames: 13557760. Throughput: 0: 1435.2, 1: 1352.8. Samples: 3381411. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:47,460][109198] Avg episode reward: [(0, '-2.017'), (1, '-3.434')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:47,499][63732] Updated weights for policy 0, policy_version 1700 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:48,374][63770] DAMAGECOUNT value on done: 10706.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:48,375][63770] Sum rewards: -2.738, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-0.500', 'HEALTH': '-0.214', 'AMMO2': '0.013', 'AMMO5': '0.015', 'ARMOR': '0.049', 'AMMO4': '0.064', 'AMMO3': '0.090', 'WEAPON4': '0.150', 'HITCOUNT': '0.160', 'weapon5': '0.240', 'WEAPON5': '0.250', 'weapon4': '0.256', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.531', 'weapon3': '1.442', 'weapon2': '1.716'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:48,820][63770] DAMAGECOUNT value on done: 7632.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:50,156][63734] DAMAGECOUNT value on done: 9722.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:50,157][63734] Sum rewards: -4.873, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.282', 'AMMO4': '-0.027', 'AMMO2': '-0.005', 'AMMO5': '0.011', 'ARMOR': '0.016', 'weapon5': '0.126', 'HITCOUNT': '0.140', 'AMMO3': '0.197', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.687', 'WEAPON3': '0.950', 'weapon2': '1.364', 'FRAGCOUNT': '2.000', 'weapon3': '2.200'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:50,379][63735] DAMAGECOUNT value on done: 8998.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:50,379][63735] Sum rewards: -5.852, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.575', 'AMMO5': '0.005', 'AMMO2': '0.007', 'AMMO4': '0.034', 'WEAPON5': '0.050', 'ARMOR': '0.088', 'WEAPON4': '0.100', 'HITCOUNT': '0.140', 'AMMO3': '0.147', 'weapon4': '0.198', 'DAMAGECOUNT': '0.516', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon3': '1.380', 'weapon2': '1.958'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:50,481][63734] DAMAGECOUNT value on done: 9302.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:50,482][63734] Sum rewards: 1.310, reward structure: {'DEATHCOUNT': '-5.250', 'AMMO5': '0.013', 'weapon4': '0.022', 'AMMO2': '0.024', 'weapon5': '0.042', 'WEAPON4': '0.050', 'HEALTH': '0.064', 'AMMO3': '0.093', 'AMMO4': '0.118', 'WEAPON5': '0.150', 'HITCOUNT': '0.200', 'ARMOR': '0.536', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.717', 'FRAGCOUNT': '1.000', 'weapon3': '1.430', 'weapon2': '1.552'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:50,786][63735] DAMAGECOUNT value on done: 10720.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:50,786][63735] Sum rewards: -1.223, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.202', 'AMMO2': '0.007', 'AMMO5': '0.019', 'AMMO4': '0.035', 'weapon4': '0.110', 'AMMO3': '0.127', 'WEAPON4': '0.200', 'HITCOUNT': '0.340', 'weapon5': '0.344', 'WEAPON5': '0.350', 'WEAPON3': '0.850', 'ARMOR': '0.924', 'weapon3': '1.350', 'DAMAGECOUNT': '1.872', 'weapon2': '1.950', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:51,632][63767] DAMAGECOUNT value on done: 10362.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:51,632][63767] Sum rewards: 1.111, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.381', 'AMMO2': '0.011', 'ARMOR': '0.032', 'AMMO4': '0.057', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON4': '0.100', 'weapon7': '0.100', 'AMMO3': '0.175', 'weapon4': '0.248', 'HITCOUNT': '0.300', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.155', 'weapon2': '1.712', 'weapon3': '1.752', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:51,863][63735] DAMAGECOUNT value on done: 9072.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:51,864][63735] Sum rewards: 0.094, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.724', 'AMMO4': '-0.031', 'AMMO2': '-0.006', 'AMMO5': '0.005', 'AMMO3': '0.054', 'weapon5': '0.062', 'WEAPON5': '0.100', 'HITCOUNT': '0.130', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.402', 'weapon3': '1.110', 'weapon2': '1.842', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:52,042][63767] DAMAGECOUNT value on done: 9484.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:52,196][63769] DAMAGECOUNT value on done: 9482.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:52,197][63769] Sum rewards: -4.544, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.024', 'WEAPON1': '0.010', 'AMMO5': '0.020', 'AMMO2': '0.033', 'ARMOR': '0.036', 'HITCOUNT': '0.100', 'AMMO3': '0.130', 'AMMO4': '0.165', 'weapon5': '0.172', 'weapon4': '0.178', 'WEAPON4': '0.200', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.420', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.850', 'weapon2': '1.346', 'weapon3': '1.920'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:52,280][63735] DAMAGECOUNT value on done: 6925.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:52,280][63735] Sum rewards: -1.649, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.949', 'AMMO2': '0.001', 'AMMO4': '0.004', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'weapon5': '0.016', 'ARMOR': '0.068', 'AMMO3': '0.092', 'WEAPON5': '0.100', 'HITCOUNT': '0.250', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.050', 'weapon2': '1.438', 'FRAGCOUNT': '1.500', 'weapon3': '1.666'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:52,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11195.7, 300 sec: 11330.0). Total num frames: 13615104. Throughput: 0: 1455.9, 1: 1324.4. Samples: 3398479. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:52,460][109198] Avg episode reward: [(0, '-1.873'), (1, '-3.440')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:52,462][63454] Saving new best policy, reward=-1.873!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:52,555][63769] DAMAGECOUNT value on done: 9071.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:52,693][63806] DAMAGECOUNT value on done: 7635.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:52,693][63806] Sum rewards: -0.864, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.663', 'AMMO2': '0.006', 'AMMO5': '0.007', 'AMMO4': '0.029', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'weapon7': '0.080', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon5': '0.104', 'AMMO3': '0.122', 'WEAPON5': '0.150', 'weapon4': '0.204', 'HITCOUNT': '0.230', 'weapon2': '0.776', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.861', 'weapon3': '2.048', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:53,057][63806] DAMAGECOUNT value on done: 9519.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:53,057][63806] Sum rewards: -2.024, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.708', 'AMMO5': '0.003', 'AMMO2': '0.007', 'weapon5': '0.014', 'AMMO4': '0.033', 'WEAPON5': '0.050', 'ARMOR': '0.063', 'HITCOUNT': '0.070', 'AMMO3': '0.074', 'WEAPON4': '0.100', 'weapon4': '0.224', 'DAMAGECOUNT': '0.255', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.312', 'weapon2': '1.730'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:53,201][63805] DAMAGECOUNT value on done: 10783.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:53,245][63734] DAMAGECOUNT value on done: 8940.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:53,245][63734] Sum rewards: -6.650, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.842', 'FRAGCOUNT': '-0.500', 'weapon4': '0.004', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO2': '0.017', 'ARMOR': '0.052', 'AMMO4': '0.086', 'WEAPON4': '0.100', 'weapon5': '0.146', 'AMMO3': '0.163', 'HITCOUNT': '0.170', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.549', 'WEAPON3': '0.750', 'weapon2': '1.574', 'weapon3': '2.058'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:53,518][63805] DAMAGECOUNT value on done: 7958.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:53,518][63805] Sum rewards: -4.586, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.968', 'AMMO2': '0.000', 'AMMO4': '0.001', 'AMMO5': '0.015', 'weapon5': '0.042', 'ARMOR': '0.056', 'AMMO3': '0.170', 'WEAPON5': '0.200', 'HITCOUNT': '0.270', 'DAMAGECOUNT': '0.951', 'WEAPON3': '1.000', 'weapon2': '1.550', 'weapon3': '1.626', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:53,571][63734] DAMAGECOUNT value on done: 7125.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:53,572][63734] Sum rewards: -0.477, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.418', 'AMMO2': '0.015', 'AMMO4': '0.075', 'WEAPON4': '0.100', 'AMMO3': '0.110', 'ARMOR': '0.116', 'weapon4': '0.128', 'HITCOUNT': '0.320', 'WEAPON3': '0.450', 'DAMAGECOUNT': '1.149', 'weapon3': '1.206', 'weapon2': '2.022', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:53,834][63732] Updated weights for policy 0, policy_version 1710 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:54,664][63733] Updated weights for policy 1, policy_version 1620 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:57,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11195.7, 300 sec: 11357.7). Total num frames: 13672448. Throughput: 0: 1491.7, 1: 1280.3. Samples: 3415414. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:56:57,460][109198] Avg episode reward: [(0, '-1.831'), (1, '-3.432')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:57,466][63454] Saving new best policy, reward=-1.831!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:58,155][63769] DAMAGECOUNT value on done: 9777.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:58,156][63769] Sum rewards: -2.985, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.888', 'weapon7': '0.004', 'AMMO5': '0.015', 'weapon5': '0.028', 'AMMO2': '0.029', 'ARMOR': '0.040', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.139', 'weapon4': '0.140', 'AMMO4': '0.142', 'WEAPON5': '0.200', 'HITCOUNT': '0.250', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.930', 'WEAPON3': '0.950', 'weapon2': '1.350', 'weapon3': '2.086', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:58,623][63769] DAMAGECOUNT value on done: 7443.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:58,623][63769] Sum rewards: -5.758, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.272', 'AMMO5': '0.003', 'AMMO2': '0.012', 'weapon5': '0.026', 'WEAPON5': '0.050', 'ARMOR': '0.059', 'AMMO4': '0.059', 'HITCOUNT': '0.070', 'AMMO3': '0.140', 'DAMAGECOUNT': '0.225', 'WEAPON4': '0.250', 'weapon4': '0.344', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.092', 'weapon3': '1.884'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:59,622][63771] DAMAGECOUNT value on done: 7454.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:59,622][63771] Sum rewards: 1.036, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.984', 'WEAPON1': '0.020', 'AMMO2': '0.020', 'AMMO5': '0.023', 'weapon5': '0.080', 'ARMOR': '0.088', 'AMMO4': '0.100', 'AMMO3': '0.125', 'weapon4': '0.180', 'WEAPON4': '0.200', 'WEAPON5': '0.350', 'HITCOUNT': '0.360', 'WEAPON3': '0.800', 'weapon2': '1.250', 'DAMAGECOUNT': '1.281', 'weapon3': '2.144', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:59,789][63732] Updated weights for policy 0, policy_version 1720 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:59,942][63770] DAMAGECOUNT value on done: 8490.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:56:59,942][63770] Sum rewards: 0.728, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.412', 'AMMO2': '0.007', 'AMMO5': '0.017', 'AMMO4': '0.033', 'ARMOR': '0.036', 'weapon5': '0.076', 'AMMO3': '0.184', 'WEAPON5': '0.300', 'HITCOUNT': '0.330', 'WEAPON3': '1.000', 'DAMAGECOUNT': '1.143', 'weapon2': '1.540', 'weapon3': '2.224', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:00,024][63771] DAMAGECOUNT value on done: 10151.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:00,025][63771] Sum rewards: -0.832, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.789', 'AMMO2': '0.006', 'AMMO5': '0.028', 'AMMO4': '0.028', 'ARMOR': '0.040', 'AMMO3': '0.144', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'weapon5': '0.282', 'weapon4': '0.374', 'WEAPON5': '0.550', 'WEAPON3': '0.800', 'weapon2': '1.050', 'DAMAGECOUNT': '1.131', 'weapon3': '1.854', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:00,407][63770] DAMAGECOUNT value on done: 8110.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:00,839][63767] DAMAGECOUNT value on done: 10909.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:00,840][63767] Sum rewards: -1.698, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.974', 'AMMO2': '0.013', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'AMMO4': '0.062', 'WEAPON4': '0.100', 'HITCOUNT': '0.130', 'AMMO3': '0.149', 'weapon4': '0.162', 'weapon5': '0.256', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.381', 'ARMOR': '0.404', 'WEAPON3': '0.950', 'weapon2': '1.090', 'weapon3': '2.192', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:01,250][63767] DAMAGECOUNT value on done: 12499.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:01,251][63767] Sum rewards: 4.713, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.047', 'AMMO5': '0.007', 'weapon5': '0.034', 'AMMO2': '0.037', 'AMMO3': '0.083', 'WEAPON5': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon7': '0.126', 'HITCOUNT': '0.140', 'WEAPON4': '0.150', 'AMMO4': '0.183', 'WEAPON7': '0.200', 'weapon4': '0.268', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.681', 'ARMOR': '0.836', 'weapon2': '1.268', 'weapon3': '1.456', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:02,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11195.7, 300 sec: 11357.7). Total num frames: 13729792. Throughput: 0: 1508.5, 1: 1251.5. Samples: 3423604. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:02,460][109198] Avg episode reward: [(0, '-1.587'), (1, '-3.463')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:02,461][63454] Saving new best policy, reward=-1.587!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:03,658][63806] DAMAGECOUNT value on done: 9583.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:03,659][63806] Sum rewards: -2.526, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.232', 'AMMO2': '0.003', 'AMMO5': '0.013', 'AMMO4': '0.016', 'WEAPON1': '0.020', 'weapon5': '0.036', 'weapon4': '0.044', 'ARMOR': '0.076', 'AMMO3': '0.088', 'WEAPON4': '0.100', 'HITCOUNT': '0.130', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.048', 'weapon2': '2.332'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:03,983][63806] DAMAGECOUNT value on done: 8925.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:03,984][63806] Sum rewards: -3.201, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.615', 'AMMO2': '0.006', 'WEAPON1': '0.010', 'AMMO5': '0.019', 'ARMOR': '0.024', 'AMMO4': '0.029', 'WEAPON4': '0.050', 'weapon5': '0.066', 'AMMO3': '0.129', 'HITCOUNT': '0.190', 'weapon4': '0.206', 'WEAPON5': '0.300', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.678', 'WEAPON3': '0.800', 'weapon2': '1.016', 'weapon3': '1.890'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:04,198][63733] Updated weights for policy 1, policy_version 1630 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:05,050][63805] DAMAGECOUNT value on done: 10497.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:05,050][63805] Sum rewards: -1.902, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.410', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'AMMO2': '0.026', 'weapon5': '0.054', 'weapon7': '0.096', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.114', 'AMMO4': '0.129', 'WEAPON4': '0.200', 'weapon4': '0.230', 'HITCOUNT': '0.240', 'DAMAGECOUNT': '0.840', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.236', 'weapon3': '1.794'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:05,352][63805] DAMAGECOUNT value on done: 10838.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:05,352][63805] Sum rewards: 0.579, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.230', 'AMMO5': '0.020', 'ARMOR': '0.032', 'AMMO2': '0.038', 'weapon4': '0.056', 'WEAPON4': '0.100', 'AMMO3': '0.156', 'AMMO4': '0.187', 'weapon5': '0.284', 'HITCOUNT': '0.290', 'WEAPON5': '0.300', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.080', 'weapon2': '1.416', 'weapon3': '1.950', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:05,625][63732] Updated weights for policy 0, policy_version 1730 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:06,391][63771] DAMAGECOUNT value on done: 10499.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:06,392][63771] Sum rewards: -2.698, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.632', 'AMMO2': '0.001', 'AMMO4': '0.002', 'AMMO5': '0.014', 'WEAPON4': '0.050', 'AMMO3': '0.077', 'weapon4': '0.100', 'weapon5': '0.156', 'HITCOUNT': '0.190', 'WEAPON5': '0.350', 'ARMOR': '0.400', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.957', 'weapon3': '1.114', 'weapon2': '1.972'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:06,725][63771] DAMAGECOUNT value on done: 7588.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:06,725][63771] Sum rewards: -0.021, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.097', 'WEAPON1': '0.010', 'AMMO2': '0.034', 'AMMO3': '0.069', 'AMMO4': '0.171', 'HITCOUNT': '0.200', 'weapon4': '0.258', 'WEAPON4': '0.350', 'ARMOR': '0.404', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.765', 'weapon3': '0.994', 'weapon2': '1.870', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:07,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11127.5, 300 sec: 11343.8). Total num frames: 13783040. Throughput: 0: 1565.9, 1: 1213.5. Samples: 3440433. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:07,460][109198] Avg episode reward: [(0, '-1.663'), (1, '-3.357')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:11,449][63732] Updated weights for policy 0, policy_version 1740 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:12,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11127.5, 300 sec: 11357.7). Total num frames: 13840384. Throughput: 0: 1639.0, 1: 1184.7. Samples: 3457470. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:12,459][109198] Avg episode reward: [(0, '-1.663'), (1, '-3.357')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:13,723][63733] Updated weights for policy 1, policy_version 1640 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:13,794][63770] DAMAGECOUNT value on done: 11110.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:13,795][63770] Sum rewards: 1.927, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.650', 'AMMO5': '0.010', 'AMMO2': '0.016', 'weapon4': '0.050', 'AMMO4': '0.080', 'AMMO3': '0.110', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'weapon5': '0.228', 'HITCOUNT': '0.340', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.212', 'weapon2': '1.302', 'weapon3': '2.028', 'FRAGCOUNT': '6.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:13,909][63734] DAMAGECOUNT value on done: 9780.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:14,136][63770] DAMAGECOUNT value on done: 7760.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:14,305][63734] DAMAGECOUNT value on done: 9506.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:14,305][63734] Sum rewards: -4.681, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.607', 'AMMO2': '0.014', 'AMMO5': '0.018', 'ARMOR': '0.028', 'weapon5': '0.034', 'WEAPON4': '0.050', 'AMMO4': '0.072', 'weapon4': '0.116', 'AMMO3': '0.194', 'WEAPON5': '0.200', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.612', 'WEAPON3': '1.100', 'weapon2': '1.444', 'weapon3': '2.084', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:14,914][63767] DAMAGECOUNT value on done: 10734.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:14,914][63767] Sum rewards: 0.014, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.794', 'AMMO2': '0.002', 'AMMO4': '0.009', 'AMMO5': '0.013', 'ARMOR': '0.080', 'AMMO3': '0.084', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon7': '0.120', 'weapon5': '0.124', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'weapon4': '0.308', 'HITCOUNT': '0.330', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.116', 'weapon2': '1.212', 'weapon3': '1.710', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:15,287][63767] DAMAGECOUNT value on done: 9859.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:15,288][63767] Sum rewards: -4.166, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.625', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.010', 'AMMO2': '0.023', 'WEAPON1': '0.030', 'ARMOR': '0.056', 'AMMO4': '0.117', 'AMMO3': '0.138', 'weapon5': '0.150', 'WEAPON5': '0.200', 'weapon4': '0.238', 'WEAPON4': '0.250', 'HITCOUNT': '0.320', 'WEAPON3': '0.850', 'weapon2': '0.966', 'DAMAGECOUNT': '1.125', 'weapon3': '2.236'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:15,480][63735] DAMAGECOUNT value on done: 9092.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:15,555][63805] DAMAGECOUNT value on done: 11093.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:15,556][63805] Sum rewards: -2.355, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.052', 'AMMO5': '0.003', 'ARMOR': '0.004', 'WEAPON1': '0.010', 'weapon5': '0.022', 'AMMO2': '0.030', 'WEAPON4': '0.050', 'WEAPON5': '0.050', 'AMMO3': '0.122', 'AMMO4': '0.149', 'weapon4': '0.152', 'HITCOUNT': '0.270', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.930', 'FRAGCOUNT': '1.000', 'weapon2': '1.610', 'weapon3': '1.796'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:15,866][63805] DAMAGECOUNT value on done: 8098.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:15,866][63805] Sum rewards: -1.402, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.438', 'AMMO5': '0.003', 'AMMO2': '0.021', 'WEAPON5': '0.050', 'HITCOUNT': '0.080', 'AMMO3': '0.087', 'ARMOR': '0.088', 'AMMO4': '0.105', 'WEAPON4': '0.200', 'weapon4': '0.368', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.450', 'FRAGCOUNT': '1.000', 'weapon3': '1.150', 'weapon2': '1.764'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:15,882][63735] DAMAGECOUNT value on done: 10966.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:15,882][63735] Sum rewards: -5.230, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.147', 'AMMO5': '0.015', 'AMMO2': '0.019', 'ARMOR': '0.024', 'AMMO4': '0.094', 'weapon4': '0.128', 'AMMO3': '0.143', 'HITCOUNT': '0.180', 'weapon5': '0.186', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon7': '0.234', 'AMMO6': '0.300', 'WEAPON7': '0.300', 'AMMO7': '0.300', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.738', 'FRAGCOUNT': '1.000', 'weapon3': '1.568', 'weapon2': '1.638'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:16,130][63769] DAMAGECOUNT value on done: 10022.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:16,131][63769] Sum rewards: -2.568, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.120', 'AMMO5': '0.013', 'weapon5': '0.014', 'AMMO2': '0.018', 'ARMOR': '0.052', 'AMMO4': '0.090', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.171', 'weapon4': '0.302', 'HITCOUNT': '0.380', 'WEAPON3': '1.050', 'weapon2': '1.212', 'DAMAGECOUNT': '1.620', 'weapon3': '1.930', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:16,542][63769] DAMAGECOUNT value on done: 9242.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:16,934][63735] DAMAGECOUNT value on done: 9426.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:16,934][63735] Sum rewards: -0.652, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.090', 'AMMO5': '0.015', 'ARMOR': '0.036', 'AMMO2': '0.040', 'AMMO3': '0.093', 'AMMO4': '0.198', 'WEAPON5': '0.250', 'weapon5': '0.266', 'HITCOUNT': '0.370', 'WEAPON4': '0.450', 'WEAPON3': '0.450', 'weapon4': '0.570', 'DAMAGECOUNT': '1.062', 'weapon3': '1.190', 'weapon2': '1.448', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:16,935][63806] DAMAGECOUNT value on done: 8172.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:16,936][63806] Sum rewards: -1.257, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.915', 'AMMO5': '0.026', 'AMMO2': '0.030', 'ARMOR': '0.060', 'AMMO3': '0.113', 'AMMO4': '0.148', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'weapon4': '0.428', 'WEAPON5': '0.500', 'weapon5': '0.578', 'WEAPON3': '0.750', 'weapon3': '1.250', 'weapon2': '1.494', 'DAMAGECOUNT': '1.611', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:16,987][63734] DAMAGECOUNT value on done: 9335.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:16,987][63734] Sum rewards: -7.574, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-4.260', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'AMMO2': '0.035', 'weapon5': '0.068', 'ARMOR': '0.092', 'WEAPON5': '0.100', 'AMMO3': '0.145', 'AMMO4': '0.172', 'HITCOUNT': '0.320', 'weapon4': '0.322', 'WEAPON4': '0.500', 'WEAPON3': '1.050', 'DAMAGECOUNT': '1.185', 'weapon2': '1.544', 'weapon3': '1.878', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:17,314][63735] DAMAGECOUNT value on done: 7505.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:17,314][63735] Sum rewards: 0.684, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.725', 'AMMO2': '0.003', 'AMMO5': '0.007', 'AMMO4': '0.016', 'weapon5': '0.022', 'AMMO3': '0.109', 'WEAPON5': '0.150', 'weapon4': '0.186', 'WEAPON4': '0.250', 'ARMOR': '0.465', 'HITCOUNT': '0.490', 'WEAPON3': '0.750', 'weapon3': '1.714', 'DAMAGECOUNT': '1.740', 'weapon2': '1.756', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:17,324][63806] DAMAGECOUNT value on done: 9667.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:17,337][63734] DAMAGECOUNT value on done: 7325.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:17,338][63734] Sum rewards: -1.173, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.842', 'AMMO5': '0.010', 'AMMO2': '0.018', 'weapon5': '0.026', 'AMMO4': '0.089', 'AMMO3': '0.138', 'HITCOUNT': '0.180', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.462', 'ARMOR': '0.504', 'DAMAGECOUNT': '0.600', 'weapon2': '0.692', 'WEAPON3': '0.900', 'weapon3': '1.900', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:17,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11127.5, 300 sec: 11357.7). Total num frames: 13897728. Throughput: 0: 1660.8, 1: 1172.9. Samples: 3466033. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:17,460][109198] Avg episode reward: [(0, '-1.764'), (1, '-3.421')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:17,605][63732] Updated weights for policy 0, policy_version 1750 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:21,463][63733] Updated weights for policy 1, policy_version 1650 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:22,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11264.0, 300 sec: 11371.6). Total num frames: 13955072. Throughput: 0: 1651.5, 1: 1183.1. Samples: 3483182. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:22,460][109198] Avg episode reward: [(0, '-1.764'), (1, '-3.421')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:23,099][63771] DAMAGECOUNT value on done: 7980.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:23,100][63771] Sum rewards: -1.578, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.150', 'WEAPON1': '0.010', 'AMMO2': '0.019', 'AMMO5': '0.019', 'AMMO4': '0.094', 'AMMO3': '0.134', 'weapon4': '0.204', 'HITCOUNT': '0.250', 'WEAPON4': '0.300', 'WEAPON5': '0.350', 'weapon5': '0.426', 'WEAPON3': '0.700', 'weapon2': '1.330', 'FRAGCOUNT': '1.500', 'DAMAGECOUNT': '1.578', 'weapon3': '1.658'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:23,436][63769] DAMAGECOUNT value on done: 10311.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:23,436][63769] Sum rewards: 2.870, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.070', 'AMMO2': '0.012', 'ARMOR': '0.054', 'AMMO4': '0.057', 'weapon7': '0.070', 'AMMO3': '0.115', 'WEAPON4': '0.200', 'weapon4': '0.220', 'AMMO6': '0.300', 'WEAPON7': '0.300', 'AMMO7': '0.300', 'HITCOUNT': '0.330', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.602', 'weapon3': '1.712', 'weapon2': '1.718', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:23,488][63771] DAMAGECOUNT value on done: 10374.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:23,489][63771] Sum rewards: 1.157, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.307', 'AMMO2': '0.001', 'AMMO4': '0.004', 'AMMO5': '0.007', 'AMMO3': '0.092', 'weapon5': '0.120', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'WEAPON3': '0.350', 'ARMOR': '0.420', 'DAMAGECOUNT': '0.669', 'weapon3': '1.534', 'weapon2': '1.966', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:23,761][63767] DAMAGECOUNT value on done: 11259.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:23,762][63767] Sum rewards: -3.560, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.266', 'WEAPON1': '0.010', 'AMMO2': '0.022', 'AMMO5': '0.025', 'AMMO3': '0.089', 'ARMOR': '0.106', 'AMMO4': '0.108', 'weapon5': '0.154', 'HITCOUNT': '0.210', 'WEAPON4': '0.300', 'WEAPON5': '0.350', 'FRAGCOUNT': '0.500', 'weapon4': '0.508', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.050', 'weapon2': '1.306', 'weapon3': '1.368'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:23,814][63769] DAMAGECOUNT value on done: 7475.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:24,144][63767] DAMAGECOUNT value on done: 13054.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:24,144][63767] Sum rewards: -0.961, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.442', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO4': '0.048', 'weapon7': '0.060', 'ARMOR': '0.092', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.151', 'WEAPON7': '0.200', 'WEAPON4': '0.250', 'HITCOUNT': '0.440', 'weapon4': '0.492', 'WEAPON3': '0.800', 'weapon2': '0.842', 'weapon3': '1.436', 'DAMAGECOUNT': '1.665', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:24,886][63732] Updated weights for policy 0, policy_version 1760 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:25,393][63770] DAMAGECOUNT value on done: 8683.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:25,394][63770] Sum rewards: 2.286, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.615', 'AMMO5': '0.003', 'AMMO2': '0.009', 'AMMO3': '0.040', 'AMMO4': '0.043', 'WEAPON5': '0.050', 'weapon5': '0.060', 'HITCOUNT': '0.200', 'WEAPON4': '0.250', 'WEAPON3': '0.250', 'weapon4': '0.466', 'DAMAGECOUNT': '0.579', 'ARMOR': '0.580', 'weapon3': '0.802', 'weapon2': '1.070', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:25,757][63770] DAMAGECOUNT value on done: 8379.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:25,758][63770] Sum rewards: -2.863, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.558', 'AMMO5': '0.005', 'weapon5': '0.006', 'AMMO2': '0.007', 'ARMOR': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.033', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.124', 'AMMO3': '0.141', 'HITCOUNT': '0.220', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.807', 'weapon2': '1.702', 'weapon3': '1.768', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:26,055][63806] DAMAGECOUNT value on done: 9737.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:26,356][63806] DAMAGECOUNT value on done: 9100.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:27,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11332.3, 300 sec: 11371.6). Total num frames: 14012416. Throughput: 0: 1623.8, 1: 1204.7. Samples: 3500078. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:27,460][109198] Avg episode reward: [(0, '-1.677'), (1, '-3.320')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:28,128][63805] DAMAGECOUNT value on done: 10537.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:28,519][63805] DAMAGECOUNT value on done: 11289.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:28,519][63805] Sum rewards: -0.565, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.406', 'WEAPON1': '0.010', 'AMMO2': '0.019', 'AMMO5': '0.026', 'ARMOR': '0.072', 'AMMO4': '0.096', 'AMMO3': '0.110', 'WEAPON4': '0.250', 'HITCOUNT': '0.250', 'weapon4': '0.412', 'weapon5': '0.444', 'WEAPON5': '0.450', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.600', 'weapon3': '1.248', 'DAMAGECOUNT': '1.353', 'weapon2': '1.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:28,636][63733] Updated weights for policy 1, policy_version 1660 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:29,103][63771] DAMAGECOUNT value on done: 10532.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:29,529][63771] DAMAGECOUNT value on done: 7732.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:29,530][63771] Sum rewards: -1.461, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.356', 'AMMO2': '0.004', 'AMMO5': '0.014', 'WEAPON1': '0.020', 'AMMO4': '0.020', 'WEAPON4': '0.050', 'HITCOUNT': '0.080', 'AMMO3': '0.090', 'weapon4': '0.146', 'weapon5': '0.152', 'WEAPON3': '0.300', 'WEAPON5': '0.300', 'weapon3': '0.314', 'DAMAGECOUNT': '0.432', 'ARMOR': '0.940', 'FRAGCOUNT': '2.000', 'weapon2': '2.532'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:32,052][63732] Updated weights for policy 0, policy_version 1770 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:32,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11400.5, 300 sec: 11385.5). Total num frames: 14069760. Throughput: 0: 1612.3, 1: 1215.9. Samples: 3508680. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:32,460][109198] Avg episode reward: [(0, '-1.688'), (1, '-3.341')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:35,985][63733] Updated weights for policy 1, policy_version 1670 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:37,203][63734] DAMAGECOUNT value on done: 9977.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:37,204][63734] Sum rewards: -1.565, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.370', 'AMMO4': '-0.004', 'AMMO2': '-0.001', 'AMMO5': '0.003', 'WEAPON1': '0.020', 'WEAPON5': '0.050', 'weapon4': '0.062', 'weapon5': '0.072', 'AMMO3': '0.088', 'WEAPON4': '0.100', 'HITCOUNT': '0.180', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.591', 'FRAGCOUNT': '1.000', 'weapon3': '1.096', 'weapon2': '2.098'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:37,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11264.0, 300 sec: 11385.5). Total num frames: 14123008. Throughput: 0: 1585.6, 1: 1235.1. Samples: 3525412. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:37,460][109198] Avg episode reward: [(0, '-1.688'), (1, '-3.306')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:37,509][63767] DAMAGECOUNT value on done: 10841.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:37,618][63734] DAMAGECOUNT value on done: 9750.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:37,618][63734] Sum rewards: -7.249, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.562', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.014', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'AMMO4': '0.070', 'weapon5': '0.072', 'AMMO3': '0.080', 'weapon4': '0.098', 'HITCOUNT': '0.170', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'WEAPON3': '0.450', 'ARMOR': '0.534', 'DAMAGECOUNT': '0.732', 'weapon3': '1.314', 'weapon2': '1.990'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:37,836][63767] DAMAGECOUNT value on done: 10299.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:37,836][63767] Sum rewards: -2.972, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.572', 'AMMO2': '0.008', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'ARMOR': '0.028', 'AMMO4': '0.042', 'weapon7': '0.090', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon5': '0.112', 'AMMO3': '0.152', 'WEAPON5': '0.250', 'HITCOUNT': '0.320', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.850', 'weapon2': '1.212', 'DAMAGECOUNT': '1.320', 'weapon3': '2.128'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:38,401][63805] DAMAGECOUNT value on done: 11134.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:38,402][63805] Sum rewards: -4.335, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.195', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'weapon5': '0.038', 'HITCOUNT': '0.040', 'ARMOR': '0.088', 'weapon4': '0.098', 'DAMAGECOUNT': '0.123', 'AMMO3': '0.132', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.642', 'weapon2': '1.770'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:38,739][63805] DAMAGECOUNT value on done: 8513.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:38,739][63805] Sum rewards: 1.364, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.670', 'AMMO2': '0.004', 'AMMO5': '0.010', 'AMMO4': '0.019', 'WEAPON1': '0.020', 'ARMOR': '0.060', 'AMMO3': '0.068', 'weapon5': '0.078', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'HITCOUNT': '0.310', 'weapon4': '0.318', 'WEAPON3': '0.450', 'DAMAGECOUNT': '1.245', 'weapon3': '1.286', 'weapon2': '1.966', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:39,355][63732] Updated weights for policy 0, policy_version 1780 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:39,442][63770] DAMAGECOUNT value on done: 11393.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:39,443][63770] Sum rewards: -1.901, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.370', 'AMMO2': '0.007', 'AMMO5': '0.015', 'WEAPON1': '0.030', 'AMMO4': '0.032', 'AMMO3': '0.104', 'HITCOUNT': '0.240', 'WEAPON5': '0.250', 'weapon5': '0.328', 'ARMOR': '0.460', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.849', 'weapon3': '1.560', 'weapon2': '1.694'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:39,565][63769] DAMAGECOUNT value on done: 10216.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:39,565][63769] Sum rewards: -2.864, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.800', 'AMMO2': '0.006', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO4': '0.029', 'WEAPON4': '0.100', 'AMMO3': '0.109', 'weapon4': '0.110', 'weapon5': '0.112', 'WEAPON5': '0.150', 'HITCOUNT': '0.210', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.582', 'FRAGCOUNT': '1.000', 'weapon3': '1.138', 'weapon2': '2.062'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:39,826][63770] DAMAGECOUNT value on done: 7960.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:39,827][63770] Sum rewards: -2.257, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.802', 'AMMO5': '0.013', 'AMMO2': '0.013', 'WEAPON1': '0.030', 'AMMO4': '0.062', 'ARMOR': '0.078', 'AMMO3': '0.083', 'HITCOUNT': '0.150', 'weapon5': '0.162', 'weapon4': '0.196', 'WEAPON5': '0.250', 'WEAPON4': '0.300', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.182', 'weapon2': '1.626'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:39,941][63769] DAMAGECOUNT value on done: 9502.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:39,941][63769] Sum rewards: -4.631, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.452', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'weapon5': '0.014', 'AMMO2': '0.026', 'WEAPON5': '0.050', 'ARMOR': '0.068', 'AMMO4': '0.131', 'AMMO3': '0.147', 'weapon4': '0.234', 'HITCOUNT': '0.260', 'WEAPON4': '0.350', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.780', 'weapon2': '1.586', 'weapon3': '1.662'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:40,355][63734] DAMAGECOUNT value on done: 9802.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:40,355][63734] Sum rewards: -3.063, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.982', 'AMMO5': '0.010', 'ARMOR': '0.028', 'AMMO2': '0.033', 'AMMO3': '0.129', 'AMMO4': '0.165', 'WEAPON5': '0.250', 'WEAPON4': '0.300', 'weapon4': '0.328', 'HITCOUNT': '0.340', 'weapon5': '0.474', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.750', 'weapon2': '1.384', 'DAMAGECOUNT': '1.401', 'weapon3': '1.576'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:40,512][63735] DAMAGECOUNT value on done: 9347.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:40,513][63735] Sum rewards: -1.275, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.235', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'AMMO5': '0.013', 'weapon5': '0.026', 'WEAPON1': '0.030', 'AMMO3': '0.078', 'ARMOR': '0.092', 'WEAPON4': '0.100', 'HITCOUNT': '0.160', 'weapon4': '0.166', 'WEAPON5': '0.250', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.765', 'weapon3': '1.508', 'weapon2': '1.736', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:40,672][63734] DAMAGECOUNT value on done: 7595.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:40,673][63734] Sum rewards: -2.166, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.360', 'AMMO2': '0.005', 'AMMO5': '0.013', 'AMMO4': '0.025', 'ARMOR': '0.072', 'AMMO3': '0.140', 'weapon5': '0.154', 'weapon4': '0.226', 'WEAPON4': '0.250', 'HITCOUNT': '0.280', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.810', 'WEAPON3': '0.950', 'weapon2': '1.564', 'weapon3': '1.654', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:40,892][63735] DAMAGECOUNT value on done: 11367.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:40,892][63735] Sum rewards: 0.172, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.130', 'AMMO2': '0.010', 'AMMO5': '0.015', 'AMMO4': '0.052', 'AMMO3': '0.094', 'weapon5': '0.100', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'weapon4': '0.308', 'HITCOUNT': '0.410', 'ARMOR': '0.432', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.203', 'weapon2': '1.606', 'weapon3': '1.772'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:41,941][63806] DAMAGECOUNT value on done: 8186.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:42,036][63735] DAMAGECOUNT value on done: 9823.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:42,037][63735] Sum rewards: -1.371, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.758', 'WEAPON1': '0.010', 'AMMO5': '0.017', 'AMMO2': '0.021', 'ARMOR': '0.048', 'AMMO3': '0.099', 'AMMO4': '0.104', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'WEAPON4': '0.300', 'weapon5': '0.378', 'weapon4': '0.454', 'WEAPON3': '0.550', 'weapon2': '1.030', 'DAMAGECOUNT': '1.191', 'weapon3': '1.714', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:42,329][63806] DAMAGECOUNT value on done: 10113.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:42,329][63806] Sum rewards: -0.974, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.290', 'weapon5': '0.002', 'AMMO5': '0.010', 'ARMOR': '0.012', 'AMMO2': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.073', 'AMMO3': '0.104', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.208', 'HITCOUNT': '0.310', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.338', 'weapon2': '1.606', 'weapon3': '1.768', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:42,449][63735] DAMAGECOUNT value on done: 7966.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:42,450][63735] Sum rewards: -0.183, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.244', 'AMMO2': '0.011', 'AMMO5': '0.013', 'ARMOR': '0.028', 'WEAPON1': '0.040', 'AMMO4': '0.056', 'weapon5': '0.084', 'WEAPON4': '0.100', 'AMMO3': '0.121', 'HITCOUNT': '0.230', 'WEAPON5': '0.300', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.380', 'weapon2': '1.534', 'weapon3': '1.814', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:42,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11264.0, 300 sec: 11385.5). Total num frames: 14180352. Throughput: 0: 1547.0, 1: 1273.0. Samples: 3542311. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:42,460][109198] Avg episode reward: [(0, '-1.781'), (1, '-3.177')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:43,289][63733] Updated weights for policy 1, policy_version 1680 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:46,237][63771] DAMAGECOUNT value on done: 8687.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:46,238][63771] Sum rewards: -3.165, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.444', 'AMMO2': '0.015', 'ARMOR': '0.028', 'WEAPON1': '0.030', 'AMMO5': '0.035', 'WEAPON4': '0.050', 'AMMO4': '0.074', 'AMMO3': '0.130', 'weapon4': '0.150', 'weapon5': '0.248', 'HITCOUNT': '0.450', 'WEAPON5': '0.550', 'WEAPON3': '0.750', 'weapon2': '1.330', 'FRAGCOUNT': '1.500', 'weapon3': '1.818', 'DAMAGECOUNT': '2.121'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:46,320][63767] DAMAGECOUNT value on done: 11513.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:46,321][63767] Sum rewards: 1.427, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO5': '0.015', 'AMMO2': '0.023', 'WEAPON4': '0.050', 'weapon7': '0.058', 'AMMO3': '0.100', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'weapon4': '0.102', 'AMMO4': '0.115', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'weapon5': '0.300', 'ARMOR': '0.408', 'WEAPON3': '0.550', 'HEALTH': '0.578', 'DAMAGECOUNT': '0.762', 'weapon2': '1.434', 'weapon3': '1.662', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:46,585][63732] Updated weights for policy 0, policy_version 1790 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:46,603][63771] DAMAGECOUNT value on done: 11057.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:46,603][63771] Sum rewards: 0.437, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.764', 'AMMO2': '0.008', 'WEAPON1': '0.020', 'AMMO5': '0.030', 'AMMO4': '0.040', 'AMMO3': '0.166', 'weapon5': '0.354', 'ARMOR': '0.400', 'WEAPON5': '0.500', 'HITCOUNT': '0.510', 'WEAPON3': '0.850', 'weapon2': '1.188', 'DAMAGECOUNT': '2.049', 'weapon3': '2.086', 'FRAGCOUNT': '3.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:46,687][63767] DAMAGECOUNT value on done: 13472.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:46,688][63767] Sum rewards: 1.548, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.406', 'AMMO5': '0.015', 'weapon7': '0.024', 'AMMO2': '0.028', 'ARMOR': '0.072', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.114', 'AMMO4': '0.140', 'weapon5': '0.150', 'WEAPON4': '0.250', 'WEAPON5': '0.250', 'weapon4': '0.286', 'HITCOUNT': '0.350', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.254', 'weapon2': '1.572', 'weapon3': '1.648', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:47,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11332.3, 300 sec: 11385.5). Total num frames: 14237696. Throughput: 0: 1528.2, 1: 1297.2. Samples: 3550748. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:47,460][109198] Avg episode reward: [(0, '-1.784'), (1, '-3.106')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:48,921][63769] DAMAGECOUNT value on done: 10580.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:48,922][63769] Sum rewards: -3.035, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.162', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.001', 'AMMO4': '0.005', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'WEAPON4': '0.150', 'AMMO3': '0.151', 'HITCOUNT': '0.160', 'weapon4': '0.214', 'weapon5': '0.300', 'WEAPON5': '0.400', 'ARMOR': '0.516', 'weapon2': '0.592', 'DAMAGECOUNT': '0.807', 'WEAPON3': '0.850', 'weapon3': '2.192'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:49,068][63806] DAMAGECOUNT value on done: 9886.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:49,068][63806] Sum rewards: -5.953, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.110', 'AMMO5': '0.003', 'AMMO2': '0.020', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'WEAPON5': '0.050', 'AMMO4': '0.098', 'AMMO3': '0.138', 'HITCOUNT': '0.150', 'weapon4': '0.244', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.447', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.494', 'weapon3': '1.812'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:49,313][63769] DAMAGECOUNT value on done: 7650.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:49,314][63769] Sum rewards: -3.527, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.226', 'AMMO5': '0.005', 'AMMO2': '0.021', 'AMMO3': '0.080', 'ARMOR': '0.092', 'weapon5': '0.094', 'WEAPON5': '0.100', 'AMMO4': '0.105', 'weapon4': '0.128', 'HITCOUNT': '0.150', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.525', 'weapon3': '1.282', 'FRAGCOUNT': '2.000', 'weapon2': '2.016'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:49,393][63806] DAMAGECOUNT value on done: 9360.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:49,394][63806] Sum rewards: -3.098, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.100', 'AMMO5': '0.007', 'AMMO2': '0.023', 'ARMOR': '0.048', 'weapon5': '0.056', 'AMMO3': '0.091', 'WEAPON4': '0.100', 'AMMO4': '0.116', 'WEAPON5': '0.150', 'HITCOUNT': '0.230', 'weapon4': '0.294', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.780', 'weapon3': '1.568', 'weapon2': '1.688', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:50,396][63733] Updated weights for policy 1, policy_version 1690 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:50,977][63805] DAMAGECOUNT value on done: 10671.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:50,978][63805] Sum rewards: -0.488, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.190', 'AMMO4': '-0.036', 'AMMO2': '-0.007', 'AMMO5': '0.007', 'HITCOUNT': '0.060', 'AMMO3': '0.070', 'ARMOR': '0.072', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon5': '0.134', 'weapon7': '0.146', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.402', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.194', 'weapon2': '1.910'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:51,234][63770] DAMAGECOUNT value on done: 8883.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:51,323][63805] DAMAGECOUNT value on done: 11697.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:51,324][63805] Sum rewards: -0.251, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.713', 'AMMO2': '0.009', 'AMMO5': '0.020', 'AMMO4': '0.047', 'AMMO3': '0.107', 'weapon7': '0.190', 'HITCOUNT': '0.200', 'AMMO6': '0.220', 'AMMO7': '0.220', 'WEAPON5': '0.250', 'weapon5': '0.286', 'WEAPON7': '0.300', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.224', 'weapon2': '1.552', 'weapon3': '1.736'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:51,628][63770] DAMAGECOUNT value on done: 8934.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:51,629][63770] Sum rewards: 4.116, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.152', 'AMMO5': '0.010', 'AMMO2': '0.021', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'AMMO4': '0.104', 'AMMO3': '0.166', 'weapon4': '0.212', 'weapon5': '0.222', 'HITCOUNT': '0.430', 'ARMOR': '0.848', 'weapon2': '0.862', 'WEAPON3': '0.950', 'DAMAGECOUNT': '1.665', 'weapon3': '1.878', 'FRAGCOUNT': '6.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:52,026][63771] DAMAGECOUNT value on done: 10797.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:52,342][63771] DAMAGECOUNT value on done: 8057.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:52,343][63771] Sum rewards: -7.340, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.901', 'AMMO5': '0.005', 'AMMO2': '0.013', 'WEAPON1': '0.050', 'AMMO4': '0.067', 'WEAPON5': '0.100', 'AMMO3': '0.177', 'HITCOUNT': '0.260', 'DAMAGECOUNT': '0.975', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.100', 'weapon2': '1.614', 'weapon3': '1.950'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:52,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11332.3, 300 sec: 11385.5). Total num frames: 14295040. Throughput: 0: 1487.6, 1: 1344.2. Samples: 3567860. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:52,459][109198] Avg episode reward: [(0, '-1.672'), (1, '-3.217')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:53,695][63732] Updated weights for policy 0, policy_version 1800 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:57,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11332.3, 300 sec: 11399.4). Total num frames: 14352384. Throughput: 0: 1443.9, 1: 1389.4. Samples: 3584968. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:57:57,460][109198] Avg episode reward: [(0, '-1.672'), (1, '-3.217')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:57,666][63733] Updated weights for policy 1, policy_version 1700 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:59,837][63767] DAMAGECOUNT value on done: 11276.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:57:59,837][63767] Sum rewards: -2.091, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.568', 'AMMO2': '0.021', 'AMMO5': '0.023', 'ARMOR': '0.044', 'weapon5': '0.066', 'AMMO4': '0.106', 'AMMO3': '0.178', 'HITCOUNT': '0.380', 'WEAPON4': '0.400', 'WEAPON5': '0.400', 'weapon4': '0.484', 'WEAPON3': '1.150', 'weapon2': '1.158', 'DAMAGECOUNT': '1.305', 'weapon3': '2.012', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:00,221][63767] DAMAGECOUNT value on done: 10509.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:00,222][63767] Sum rewards: -4.359, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.148', 'AMMO2': '0.012', 'AMMO5': '0.015', 'weapon5': '0.028', 'ARMOR': '0.040', 'AMMO4': '0.061', 'weapon4': '0.086', 'WEAPON4': '0.100', 'AMMO3': '0.141', 'HITCOUNT': '0.170', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.630', 'WEAPON3': '0.750', 'weapon3': '1.706', 'weapon2': '1.850', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:00,231][63734] DAMAGECOUNT value on done: 10247.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:00,232][63734] Sum rewards: -4.171, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.658', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.010', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'weapon5': '0.032', 'AMMO4': '0.051', 'ARMOR': '0.060', 'WEAPON4': '0.150', 'AMMO3': '0.156', 'WEAPON5': '0.200', 'HITCOUNT': '0.230', 'weapon4': '0.288', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.810', 'weapon2': '1.090', 'weapon3': '1.624'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:00,560][63734] DAMAGECOUNT value on done: 9933.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:00,560][63734] Sum rewards: -7.336, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-3.058', 'AMMO5': '0.005', 'AMMO2': '0.021', 'weapon5': '0.032', 'ARMOR': '0.036', 'WEAPON5': '0.100', 'AMMO4': '0.105', 'AMMO3': '0.133', 'HITCOUNT': '0.180', 'weapon4': '0.182', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.549', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.384', 'weapon3': '2.044'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:00,932][63732] Updated weights for policy 0, policy_version 1810 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:01,339][63805] DAMAGECOUNT value on done: 11523.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:01,339][63805] Sum rewards: -2.501, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.646', 'AMMO4': '-0.064', 'AMMO2': '-0.013', 'AMMO5': '0.016', 'WEAPON1': '0.020', 'ARMOR': '0.068', 'weapon5': '0.116', 'AMMO3': '0.140', 'WEAPON5': '0.200', 'HITCOUNT': '0.330', 'WEAPON3': '1.000', 'DAMAGECOUNT': '1.167', 'weapon2': '1.550', 'weapon3': '1.864', 'FRAGCOUNT': '3.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:01,724][63805] DAMAGECOUNT value on done: 8887.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:01,724][63805] Sum rewards: -7.069, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.548', 'AMMO5': '0.007', 'AMMO2': '0.008', 'WEAPON1': '0.010', 'AMMO4': '0.038', 'WEAPON5': '0.050', 'ARMOR': '0.096', 'AMMO3': '0.154', 'HITCOUNT': '0.360', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.122', 'weapon3': '1.718', 'weapon2': '1.816'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:02,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11332.3, 300 sec: 11399.4). Total num frames: 14409728. Throughput: 0: 1424.3, 1: 1404.4. Samples: 3593324. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:02,460][109198] Avg episode reward: [(0, '-1.629'), (1, '-3.423')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:03,088][63769] DAMAGECOUNT value on done: 10281.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:03,414][63734] DAMAGECOUNT value on done: 9937.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:03,415][63734] Sum rewards: 0.282, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.050', 'AMMO2': '0.005', 'WEAPON1': '0.020', 'AMMO5': '0.020', 'AMMO4': '0.022', 'ARMOR': '0.074', 'WEAPON4': '0.100', 'HITCOUNT': '0.140', 'AMMO3': '0.142', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.405', 'weapon5': '0.416', 'WEAPON3': '0.750', 'weapon2': '1.284', 'weapon3': '1.754', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:03,418][63769] DAMAGECOUNT value on done: 9788.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:03,419][63769] Sum rewards: 0.799, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.718', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.019', 'AMMO3': '0.125', 'HITCOUNT': '0.140', 'WEAPON5': '0.250', 'weapon5': '0.264', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.858', 'weapon3': '1.374', 'weapon2': '1.710', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:03,749][63734] DAMAGECOUNT value on done: 8073.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:03,749][63734] Sum rewards: -1.559, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.886', 'AMMO5': '0.010', 'AMMO2': '0.014', 'AMMO4': '0.070', 'WEAPON4': '0.100', 'weapon5': '0.102', 'AMMO3': '0.134', 'WEAPON5': '0.200', 'weapon4': '0.254', 'HITCOUNT': '0.330', 'ARMOR': '0.408', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.434', 'FRAGCOUNT': '1.500', 'weapon2': '1.592', 'weapon3': '1.628'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:05,020][63733] Updated weights for policy 1, policy_version 1710 (0.0013)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:05,215][63770] DAMAGECOUNT value on done: 11553.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:05,216][63770] Sum rewards: -7.476, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.040', 'WEAPON1': '0.010', 'AMMO2': '0.016', 'AMMO5': '0.025', 'ARMOR': '0.032', 'AMMO4': '0.079', 'AMMO3': '0.168', 'HITCOUNT': '0.170', 'WEAPON4': '0.250', 'weapon5': '0.278', 'weapon4': '0.352', 'DAMAGECOUNT': '0.480', 'WEAPON5': '0.500', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon3': '1.362', 'weapon2': '1.642'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:05,455][63735] DAMAGECOUNT value on done: 9362.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:05,577][63770] DAMAGECOUNT value on done: 8044.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:05,578][63770] Sum rewards: 0.439, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.989', 'AMMO2': '0.005', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO4': '0.026', 'ARMOR': '0.068', 'AMMO3': '0.079', 'HITCOUNT': '0.080', 'weapon5': '0.114', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.252', 'WEAPON3': '0.550', 'weapon3': '1.358', 'weapon2': '1.968', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:05,815][63735] DAMAGECOUNT value on done: 11472.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:05,815][63735] Sum rewards: -1.561, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.110', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.020', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.075', 'AMMO4': '0.098', 'weapon5': '0.174', 'AMMO6': '0.200', 'AMMO7': '0.200', 'WEAPON7': '0.200', 'weapon7': '0.250', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.400', 'weapon3': '0.944', 'FRAGCOUNT': '1.000', 'weapon2': '1.258'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:06,826][63806] DAMAGECOUNT value on done: 8495.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:06,826][63806] Sum rewards: 0.075, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.717', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'AMMO2': '0.022', 'ARMOR': '0.024', 'weapon7': '0.094', 'AMMO4': '0.112', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.124', 'WEAPON7': '0.200', 'weapon5': '0.230', 'HITCOUNT': '0.270', 'WEAPON5': '0.300', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.927', 'weapon2': '1.336', 'weapon3': '2.130', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:06,913][63735] DAMAGECOUNT value on done: 10083.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:06,913][63735] Sum rewards: -1.707, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.496', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'ARMOR': '0.032', 'WEAPON5': '0.050', 'AMMO4': '0.057', 'weapon5': '0.122', 'AMMO3': '0.164', 'HITCOUNT': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.780', 'weapon2': '1.432', 'weapon3': '2.078', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:07,213][63806] DAMAGECOUNT value on done: 10233.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:07,388][63735] DAMAGECOUNT value on done: 8039.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:07,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11400.5, 300 sec: 11399.4). Total num frames: 14467072. Throughput: 0: 1416.6, 1: 1409.6. Samples: 3610363. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:07,460][109198] Avg episode reward: [(0, '-1.594'), (1, '-3.297')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:08,140][63732] Updated weights for policy 0, policy_version 1820 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:08,622][63767] DAMAGECOUNT value on done: 12028.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:08,623][63767] Sum rewards: 1.619, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.418', 'AMMO2': '0.007', 'AMMO5': '0.007', 'AMMO4': '0.032', 'weapon4': '0.036', 'WEAPON4': '0.100', 'ARMOR': '0.104', 'AMMO3': '0.117', 'WEAPON5': '0.150', 'weapon5': '0.244', 'HITCOUNT': '0.340', 'WEAPON3': '0.800', 'weapon2': '1.160', 'DAMAGECOUNT': '1.545', 'weapon3': '1.894', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:08,999][63767] DAMAGECOUNT value on done: 13682.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:09,000][63767] Sum rewards: -1.119, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.736', 'AMMO2': '0.003', 'AMMO4': '0.016', 'AMMO3': '0.140', 'HITCOUNT': '0.180', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.630', 'weapon2': '1.372', 'weapon3': '1.426', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:09,073][63771] DAMAGECOUNT value on done: 8975.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:09,074][63771] Sum rewards: -2.196, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.858', 'AMMO2': '0.019', 'AMMO5': '0.020', 'WEAPON4': '0.050', 'weapon4': '0.072', 'AMMO4': '0.096', 'AMMO3': '0.140', 'HITCOUNT': '0.230', 'WEAPON5': '0.250', 'ARMOR': '0.416', 'weapon5': '0.426', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.864', 'FRAGCOUNT': '1.000', 'weapon2': '1.546', 'weapon3': '1.732'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:09,419][63771] DAMAGECOUNT value on done: 11487.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:09,420][63771] Sum rewards: 1.211, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.839', 'AMMO5': '0.012', 'AMMO2': '0.029', 'WEAPON4': '0.050', 'AMMO3': '0.140', 'weapon4': '0.146', 'AMMO4': '0.146', 'WEAPON5': '0.250', 'weapon5': '0.262', 'HITCOUNT': '0.320', 'WEAPON3': '0.750', 'ARMOR': '0.800', 'DAMAGECOUNT': '1.290', 'weapon2': '1.440', 'weapon3': '1.664', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:11,970][63806] DAMAGECOUNT value on done: 10156.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:11,971][63806] Sum rewards: -0.506, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.204', 'AMMO5': '0.010', 'AMMO2': '0.010', 'ARMOR': '0.040', 'WEAPON1': '0.040', 'AMMO4': '0.050', 'AMMO3': '0.090', 'weapon5': '0.128', 'WEAPON5': '0.200', 'HITCOUNT': '0.220', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.810', 'weapon3': '1.256', 'weapon2': '1.844', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:12,262][63733] Updated weights for policy 1, policy_version 1720 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:12,358][63806] DAMAGECOUNT value on done: 9820.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:12,358][63806] Sum rewards: -1.146, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.662', 'AMMO5': '0.005', 'AMMO2': '0.012', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.059', 'weapon5': '0.066', 'weapon4': '0.130', 'AMMO3': '0.152', 'HITCOUNT': '0.320', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.380', 'weapon2': '1.474', 'weapon3': '1.768', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:12,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11332.3, 300 sec: 11385.5). Total num frames: 14520320. Throughput: 0: 1419.3, 1: 1408.3. Samples: 3627319. Policy #0 lag: (min: 0.0, avg: 0.3, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:12,459][109198] Avg episode reward: [(0, '-1.556'), (1, '-3.267')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:12,500][63454] Saving new best policy, reward=-1.556!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:13,977][63805] DAMAGECOUNT value on done: 10917.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:13,977][63805] Sum rewards: -0.731, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.752', 'AMMO2': '0.009', 'AMMO5': '0.009', 'AMMO4': '0.042', 'ARMOR': '0.064', 'WEAPON5': '0.150', 'AMMO3': '0.161', 'weapon5': '0.182', 'HITCOUNT': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'DAMAGECOUNT': '0.738', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.346', 'weapon3': '2.270'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:14,361][63805] DAMAGECOUNT value on done: 12235.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:14,362][63805] Sum rewards: 1.472, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.100', 'AMMO4': '-0.019', 'AMMO2': '-0.004', 'WEAPON1': '0.010', 'AMMO5': '0.017', 'weapon5': '0.114', 'AMMO3': '0.131', 'WEAPON5': '0.300', 'HITCOUNT': '0.380', 'WEAPON3': '0.800', 'weapon2': '1.132', 'DAMAGECOUNT': '1.614', 'weapon3': '2.346', 'FRAGCOUNT': '2.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:14,415][63769] DAMAGECOUNT value on done: 10764.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:14,416][63769] Sum rewards: -1.969, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.479', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'AMMO5': '0.008', 'weapon5': '0.062', 'weapon4': '0.098', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'ARMOR': '0.116', 'AMMO3': '0.133', 'HITCOUNT': '0.190', 'DAMAGECOUNT': '0.552', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.530', 'weapon3': '1.582'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:14,840][63769] DAMAGECOUNT value on done: 7837.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:14,840][63769] Sum rewards: -3.457, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.290', 'AMMO2': '0.003', 'AMMO5': '0.005', 'AMMO4': '0.016', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'WEAPON4': '0.100', 'AMMO3': '0.107', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'weapon4': '0.178', 'weapon5': '0.208', 'DAMAGECOUNT': '0.561', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.390', 'weapon3': '1.488'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:14,844][63771] DAMAGECOUNT value on done: 11002.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:14,845][63771] Sum rewards: -1.860, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.752', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'weapon4': '0.030', 'AMMO2': '0.032', 'WEAPON5': '0.050', 'ARMOR': '0.067', 'weapon5': '0.104', 'HITCOUNT': '0.160', 'AMMO4': '0.161', 'AMMO3': '0.164', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.615', 'WEAPON3': '1.000', 'weapon2': '1.484', 'weapon3': '1.762', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:15,224][63771] DAMAGECOUNT value on done: 8247.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:15,225][63771] Sum rewards: -1.602, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.498', 'AMMO2': '0.017', 'AMMO5': '0.018', 'ARMOR': '0.036', 'weapon4': '0.044', 'WEAPON4': '0.050', 'weapon5': '0.086', 'AMMO4': '0.086', 'AMMO3': '0.115', 'HITCOUNT': '0.180', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.570', 'WEAPON3': '0.700', 'weapon3': '1.382', 'weapon2': '1.662', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:15,338][63732] Updated weights for policy 0, policy_version 1830 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:16,854][63770] DAMAGECOUNT value on done: 9076.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:16,854][63770] Sum rewards: -0.069, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.256', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'AMMO2': '0.022', 'weapon5': '0.068', 'AMMO3': '0.085', 'ARMOR': '0.108', 'AMMO4': '0.108', 'HITCOUNT': '0.130', 'WEAPON4': '0.200', 'weapon4': '0.250', 'WEAPON5': '0.300', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.579', 'FRAGCOUNT': '1.000', 'weapon2': '1.248', 'weapon3': '1.614'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:17,204][63770] DAMAGECOUNT value on done: 9424.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:17,205][63770] Sum rewards: 0.767, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.282', 'AMMO2': '0.007', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.035', 'ARMOR': '0.060', 'AMMO3': '0.165', 'WEAPON5': '0.200', 'weapon5': '0.204', 'HITCOUNT': '0.420', 'WEAPON3': '0.850', 'weapon2': '1.140', 'DAMAGECOUNT': '1.470', 'weapon3': '2.476', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:17,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11400.5, 300 sec: 11413.3). Total num frames: 14581760. Throughput: 0: 1420.0, 1: 1407.1. Samples: 3635899. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:17,460][109198] Avg episode reward: [(0, '-1.414'), (1, '-3.215')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:17,469][63454] Saving new best policy, reward=-1.414!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:19,508][63733] Updated weights for policy 1, policy_version 1730 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:22,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11332.3, 300 sec: 11385.5). Total num frames: 14635008. Throughput: 0: 1419.9, 1: 1411.4. Samples: 3652817. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:22,459][109198] Avg episode reward: [(0, '-1.414'), (1, '-3.215')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:22,577][63767] DAMAGECOUNT value on done: 11643.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:22,578][63767] Sum rewards: -7.198, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-0.886', 'AMMO2': '0.005', 'AMMO5': '0.007', 'AMMO4': '0.022', 'ARMOR': '0.064', 'WEAPON5': '0.150', 'weapon5': '0.184', 'AMMO3': '0.223', 'HITCOUNT': '0.310', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.101', 'weapon2': '1.288', 'WEAPON3': '1.300', 'weapon3': '2.284'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:22,662][63732] Updated weights for policy 0, policy_version 1840 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:22,957][63767] DAMAGECOUNT value on done: 11412.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:22,957][63767] Sum rewards: 6.838, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.557', 'AMMO4': '-0.006', 'AMMO2': '-0.001', 'AMMO5': '0.010', 'weapon6': '0.056', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON6': '0.100', 'ARMOR': '0.116', 'AMMO3': '0.135', 'WEAPON5': '0.150', 'weapon5': '0.152', 'HITCOUNT': '0.640', 'WEAPON3': '0.800', 'weapon2': '1.314', 'weapon3': '2.270', 'DAMAGECOUNT': '2.709', 'FRAGCOUNT': '7.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:23,112][63734] DAMAGECOUNT value on done: 10437.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:23,428][63734] DAMAGECOUNT value on done: 10208.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:23,428][63734] Sum rewards: -0.453, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.720', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.015', 'AMMO4': '0.074', 'WEAPON5': '0.100', 'ARMOR': '0.122', 'AMMO3': '0.124', 'WEAPON4': '0.150', 'HITCOUNT': '0.210', 'weapon4': '0.214', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.825', 'FRAGCOUNT': '1.000', 'weapon3': '1.330', 'weapon2': '1.488'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:24,066][63805] DAMAGECOUNT value on done: 11688.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:24,425][63805] DAMAGECOUNT value on done: 9073.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:24,426][63805] Sum rewards: -3.105, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.529', 'AMMO5': '0.010', 'weapon5': '0.012', 'AMMO2': '0.015', 'WEAPON1': '0.040', 'AMMO4': '0.072', 'AMMO3': '0.122', 'weapon4': '0.130', 'WEAPON5': '0.200', 'HITCOUNT': '0.210', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.558', 'ARMOR': '0.569', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.206', 'weapon2': '1.680'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:26,293][63769] DAMAGECOUNT value on done: 10566.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:26,294][63769] Sum rewards: -1.993, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.182', 'AMMO4': '-0.028', 'AMMO2': '-0.006', 'AMMO5': '0.007', 'weapon5': '0.012', 'WEAPON1': '0.040', 'AMMO3': '0.101', 'WEAPON5': '0.150', 'HITCOUNT': '0.190', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.855', 'weapon3': '1.560', 'weapon2': '1.656', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:26,548][63734] DAMAGECOUNT value on done: 10097.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:26,548][63734] Sum rewards: -4.062, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.720', 'AMMO4': '-0.015', 'AMMO2': '-0.003', 'AMMO5': '0.005', 'ARMOR': '0.032', 'HITCOUNT': '0.070', 'weapon7': '0.070', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.141', 'WEAPON5': '0.150', 'weapon5': '0.242', 'DAMAGECOUNT': '0.480', 'WEAPON3': '0.500', 'weapon3': '0.692', 'FRAGCOUNT': '1.000', 'weapon2': '2.244'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:26,644][63769] DAMAGECOUNT value on done: 9923.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:26,644][63769] Sum rewards: -5.301, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.179', 'AMMO5': '0.005', 'AMMO2': '0.010', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'weapon5': '0.032', 'AMMO4': '0.051', 'HITCOUNT': '0.080', 'WEAPON5': '0.100', 'AMMO3': '0.146', 'DAMAGECOUNT': '0.405', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.650', 'weapon2': '1.652', 'weapon3': '1.702'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:26,720][63733] Updated weights for policy 1, policy_version 1740 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:26,880][63734] DAMAGECOUNT value on done: 8241.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:26,881][63734] Sum rewards: -1.159, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.336', 'AMMO2': '0.009', 'AMMO5': '0.010', 'AMMO4': '0.045', 'HITCOUNT': '0.120', 'AMMO3': '0.129', 'weapon5': '0.130', 'WEAPON5': '0.200', 'ARMOR': '0.472', 'DAMAGECOUNT': '0.504', 'WEAPON3': '0.900', 'weapon2': '1.400', 'weapon3': '2.258', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:27,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11332.3, 300 sec: 11385.5). Total num frames: 14692352. Throughput: 0: 1417.3, 1: 1413.2. Samples: 3669682. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:27,460][109198] Avg episode reward: [(0, '-1.389'), (1, '-3.019')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:27,465][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001741_7131136.pth...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:27,466][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001846_7561216.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:27,520][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001428_5849088.pth\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:27,526][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001493_6115328.pth\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:27,533][63454] Saving new best policy, reward=-1.389!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:29,915][63732] Updated weights for policy 0, policy_version 1850 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:30,575][63735] DAMAGECOUNT value on done: 9587.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:30,575][63735] Sum rewards: -3.874, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.150', 'AMMO4': '-0.021', 'AMMO2': '-0.004', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'ARMOR': '0.028', 'weapon5': '0.046', 'WEAPON5': '0.150', 'AMMO3': '0.171', 'HITCOUNT': '0.180', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.584', 'weapon2': '1.634'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:30,860][63770] DAMAGECOUNT value on done: 11700.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:30,861][63770] Sum rewards: -1.212, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.951', 'AMMO5': '0.005', 'AMMO2': '0.014', 'weapon5': '0.036', 'AMMO4': '0.070', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.110', 'HITCOUNT': '0.130', 'weapon4': '0.182', 'DAMAGECOUNT': '0.441', 'ARMOR': '0.448', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.278', 'weapon3': '1.824'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:31,040][63735] DAMAGECOUNT value on done: 11739.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:31,041][63735] Sum rewards: -0.915, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.106', 'AMMO5': '0.007', 'AMMO2': '0.020', 'WEAPON4': '0.050', 'ARMOR': '0.058', 'AMMO4': '0.098', 'WEAPON5': '0.100', 'weapon5': '0.132', 'AMMO3': '0.146', 'weapon4': '0.208', 'HITCOUNT': '0.230', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.801', 'weapon3': '1.152', 'weapon2': '2.038', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:31,294][63770] DAMAGECOUNT value on done: 8599.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:31,294][63770] Sum rewards: -1.111, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.328', 'AMMO4': '-0.021', 'AMMO2': '-0.004', 'AMMO5': '0.023', 'WEAPON1': '0.030', 'weapon5': '0.030', 'ARMOR': '0.064', 'AMMO3': '0.169', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.350', 'HITCOUNT': '0.420', 'WEAPON3': '0.900', 'weapon2': '1.270', 'DAMAGECOUNT': '1.665', 'weapon3': '1.972', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:31,538][63806] DAMAGECOUNT value on done: 8880.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:31,538][63806] Sum rewards: 4.913, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.600', 'AMMO5': '0.010', 'AMMO2': '0.012', 'ARMOR': '0.024', 'weapon5': '0.052', 'AMMO4': '0.059', 'AMMO3': '0.173', 'WEAPON5': '0.200', 'HITCOUNT': '0.280', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.155', 'weapon2': '1.570', 'weapon3': '2.128', 'FRAGCOUNT': '8.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:31,671][63767] DAMAGECOUNT value on done: 12253.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:31,671][63767] Sum rewards: -3.785, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.632', 'AMMO2': '0.015', 'weapon4': '0.058', 'AMMO4': '0.074', 'AMMO3': '0.139', 'WEAPON4': '0.150', 'HITCOUNT': '0.210', 'ARMOR': '0.464', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.860', 'weapon3': '1.902'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:31,939][63806] DAMAGECOUNT value on done: 10350.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:32,054][63767] DAMAGECOUNT value on done: 14298.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:32,054][63767] Sum rewards: 2.401, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.044', 'AMMO2': '0.005', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'AMMO4': '0.027', 'ARMOR': '0.038', 'weapon5': '0.066', 'AMMO3': '0.157', 'WEAPON5': '0.200', 'HITCOUNT': '0.530', 'WEAPON3': '0.950', 'weapon2': '1.388', 'DAMAGECOUNT': '1.848', 'weapon3': '2.210', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:32,154][63771] DAMAGECOUNT value on done: 9390.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:32,155][63771] Sum rewards: 0.697, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.198', 'weapon5': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.014', 'weapon7': '0.024', 'ARMOR': '0.028', 'WEAPON4': '0.050', 'AMMO4': '0.068', 'weapon4': '0.084', 'AMMO3': '0.116', 'WEAPON5': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.340', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.245', 'weapon2': '1.704', 'weapon3': '1.904', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:32,230][63735] DAMAGECOUNT value on done: 10468.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:32,230][63735] Sum rewards: 0.447, reward structure: {'DEATHCOUNT': '-8.250', 'weapon4': '0.004', 'AMMO2': '0.011', 'ARMOR': '0.012', 'AMMO5': '0.022', 'AMMO4': '0.056', 'WEAPON4': '0.100', 'AMMO3': '0.123', 'HEALTH': '0.175', 'weapon5': '0.204', 'WEAPON5': '0.350', 'HITCOUNT': '0.360', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.155', 'weapon2': '1.516', 'weapon3': '1.908', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:32,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11264.0, 300 sec: 11371.6). Total num frames: 14745600. Throughput: 0: 1417.2, 1: 1414.1. Samples: 3678158. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:32,460][109198] Avg episode reward: [(0, '-1.286'), (1, '-3.035')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:32,461][63454] Saving new best policy, reward=-1.286!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:32,504][63771] DAMAGECOUNT value on done: 11822.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:32,504][63771] Sum rewards: -3.497, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.677', 'AMMO2': '0.008', 'AMMO5': '0.010', 'ARMOR': '0.016', 'AMMO4': '0.039', 'weapon5': '0.070', 'WEAPON5': '0.150', 'AMMO3': '0.168', 'HITCOUNT': '0.380', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.005', 'weapon2': '1.738', 'weapon3': '2.046'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:32,656][63735] DAMAGECOUNT value on done: 8378.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:32,657][63735] Sum rewards: -3.030, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.561', 'AMMO5': '0.005', 'ARMOR': '0.012', 'AMMO2': '0.015', 'AMMO4': '0.072', 'weapon4': '0.076', 'WEAPON5': '0.100', 'AMMO3': '0.150', 'WEAPON4': '0.200', 'HITCOUNT': '0.270', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.017', 'weapon3': '1.472', 'weapon2': '1.892', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:34,025][63733] Updated weights for policy 1, policy_version 1750 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:34,505][63806] DAMAGECOUNT value on done: 10248.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:34,918][63806] DAMAGECOUNT value on done: 9925.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:36,928][63805] DAMAGECOUNT value on done: 11339.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:36,929][63805] Sum rewards: 4.699, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.962', 'AMMO4': '-0.033', 'AMMO2': '-0.007', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'WEAPON4': '0.050', 'AMMO3': '0.069', 'weapon4': '0.178', 'WEAPON5': '0.300', 'HITCOUNT': '0.420', 'weapon5': '0.462', 'ARMOR': '0.487', 'WEAPON3': '0.500', 'weapon3': '1.244', 'DAMAGECOUNT': '1.266', 'weapon2': '1.700', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:37,166][63732] Updated weights for policy 0, policy_version 1860 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:37,343][63805] DAMAGECOUNT value on done: 12835.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:37,343][63805] Sum rewards: 2.588, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.510', 'AMMO2': '0.005', 'AMMO5': '0.017', 'AMMO4': '0.024', 'WEAPON1': '0.030', 'ARMOR': '0.040', 'AMMO3': '0.133', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon5': '0.266', 'WEAPON5': '0.350', 'HITCOUNT': '0.440', 'WEAPON3': '0.750', 'weapon3': '1.624', 'weapon2': '1.768', 'DAMAGECOUNT': '1.800', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:37,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11332.3, 300 sec: 11371.6). Total num frames: 14802944. Throughput: 0: 1414.4, 1: 1410.2. Samples: 3694967. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:37,460][109198] Avg episode reward: [(0, '-1.213'), (1, '-3.062')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:37,466][63454] Saving new best policy, reward=-1.213!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:37,864][63771] DAMAGECOUNT value on done: 11192.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:37,865][63771] Sum rewards: 0.664, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.615', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'AMMO5': '0.003', 'WEAPON1': '0.020', 'AMMO3': '0.090', 'ARMOR': '0.092', 'weapon5': '0.094', 'WEAPON5': '0.100', 'HITCOUNT': '0.120', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.570', 'weapon2': '1.076', 'weapon3': '1.196', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:38,216][63771] DAMAGECOUNT value on done: 8257.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:39,937][63769] DAMAGECOUNT value on done: 10909.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:39,938][63769] Sum rewards: -2.006, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.384', 'AMMO2': '0.011', 'AMMO5': '0.020', 'WEAPON4': '0.050', 'AMMO4': '0.057', 'ARMOR': '0.069', 'AMMO3': '0.130', 'weapon5': '0.168', 'HITCOUNT': '0.180', 'weapon4': '0.220', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.800', 'weapon2': '0.884', 'FRAGCOUNT': '1.000', 'weapon3': '2.354'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:40,320][63769] DAMAGECOUNT value on done: 7926.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:40,905][63806] Large shaping reward -2.534 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.28500000000000003, -95.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:41,428][63733] Updated weights for policy 1, policy_version 1760 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:42,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11332.3, 300 sec: 11357.7). Total num frames: 14860288. Throughput: 0: 1408.6, 1: 1405.2. Samples: 3711589. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:42,460][109198] Avg episode reward: [(0, '-1.245'), (1, '-3.042')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:42,626][63770] DAMAGECOUNT value on done: 9247.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:42,626][63770] Sum rewards: 0.185, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.372', 'AMMO2': '0.000', 'AMMO4': '0.002', 'AMMO5': '0.012', 'weapon5': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.034', 'AMMO3': '0.088', 'HITCOUNT': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON5': '0.150', 'weapon7': '0.152', 'WEAPON7': '0.200', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.513', 'weapon3': '1.070', 'weapon2': '1.712', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:43,008][63770] DAMAGECOUNT value on done: 9780.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:43,009][63770] Sum rewards: 3.938, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.556', 'AMMO2': '0.003', 'AMMO5': '0.005', 'weapon5': '0.006', 'AMMO4': '0.014', 'WEAPON1': '0.020', 'WEAPON5': '0.100', 'AMMO3': '0.144', 'HITCOUNT': '0.270', 'ARMOR': '0.440', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.068', 'weapon2': '1.488', 'weapon3': '1.986', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:44,571][63732] Updated weights for policy 0, policy_version 1870 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:45,503][63767] DAMAGECOUNT value on done: 12000.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:45,504][63767] Sum rewards: -1.403, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.090', 'ARMOR': '0.008', 'WEAPON1': '0.020', 'AMMO5': '0.022', 'AMMO2': '0.036', 'AMMO3': '0.118', 'HITCOUNT': '0.160', 'AMMO4': '0.182', 'weapon5': '0.266', 'weapon4': '0.288', 'WEAPON4': '0.300', 'WEAPON5': '0.500', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.071', 'weapon2': '1.468', 'weapon3': '1.648', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:45,819][63767] DAMAGECOUNT value on done: 11683.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:45,820][63767] Sum rewards: -2.329, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.316', 'AMMO4': '-0.017', 'AMMO2': '-0.003', 'AMMO5': '0.031', 'ARMOR': '0.032', 'AMMO3': '0.143', 'HITCOUNT': '0.210', 'weapon5': '0.270', 'WEAPON5': '0.450', 'DAMAGECOUNT': '0.813', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.562', 'weapon3': '1.896'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:46,570][63734] DAMAGECOUNT value on done: 10592.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:46,571][63734] Sum rewards: -4.890, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.944', 'AMMO4': '-0.018', 'AMMO2': '-0.004', 'ARMOR': '0.004', 'WEAPON1': '0.030', 'AMMO3': '0.098', 'WEAPON4': '0.100', 'HITCOUNT': '0.120', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.650', 'weapon3': '1.518', 'weapon2': '1.840', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:46,903][63734] DAMAGECOUNT value on done: 10427.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:46,903][63734] Sum rewards: -0.483, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.050', 'AMMO5': '0.003', 'AMMO2': '0.003', 'weapon5': '0.008', 'WEAPON1': '0.010', 'AMMO4': '0.015', 'WEAPON5': '0.050', 'ARMOR': '0.084', 'AMMO3': '0.125', 'HITCOUNT': '0.150', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.657', 'weapon2': '1.492', 'weapon3': '1.820', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:47,252][63805] DAMAGECOUNT value on done: 11703.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:47,252][63805] Sum rewards: -6.495, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-3.260', 'AMMO2': '0.003', 'AMMO4': '0.013', 'HITCOUNT': '0.020', 'DAMAGECOUNT': '0.045', 'WEAPON4': '0.100', 'ARMOR': '0.124', 'AMMO3': '0.200', 'weapon4': '0.230', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.444', 'weapon3': '1.636'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:47,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11332.3, 300 sec: 11371.6). Total num frames: 14917632. Throughput: 0: 1409.4, 1: 1407.1. Samples: 3720067. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:47,460][109198] Avg episode reward: [(0, '-1.209'), (1, '-2.966')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:47,467][63454] Saving new best policy, reward=-1.209!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:47,598][63805] DAMAGECOUNT value on done: 9243.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:47,599][63805] Sum rewards: -2.834, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.010', 'AMMO2': '0.004', 'weapon5': '0.006', 'ARMOR': '0.008', 'WEAPON1': '0.010', 'AMMO5': '0.010', 'AMMO4': '0.018', 'weapon4': '0.018', 'AMMO3': '0.088', 'WEAPON4': '0.100', 'HITCOUNT': '0.150', 'WEAPON5': '0.200', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.510', 'FRAGCOUNT': '1.000', 'weapon3': '1.214', 'weapon2': '1.840'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:48,717][63733] Updated weights for policy 1, policy_version 1770 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:49,773][63769] DAMAGECOUNT value on done: 10850.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:49,774][63769] Sum rewards: -5.423, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.966', 'AMMO4': '-0.012', 'AMMO2': '-0.002', 'ARMOR': '0.104', 'AMMO3': '0.127', 'HITCOUNT': '0.250', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.852', 'weapon2': '1.534', 'weapon3': '1.890', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:50,114][63769] DAMAGECOUNT value on done: 10003.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:50,133][63734] DAMAGECOUNT value on done: 10419.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:50,133][63734] Sum rewards: -3.554, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.856', 'AMMO2': '0.009', 'AMMO5': '0.022', 'ARMOR': '0.024', 'WEAPON1': '0.030', 'AMMO4': '0.045', 'weapon5': '0.146', 'AMMO3': '0.184', 'HITCOUNT': '0.270', 'WEAPON5': '0.350', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.966', 'weapon2': '1.096', 'FRAGCOUNT': '2.000', 'weapon3': '2.510'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:50,537][63734] DAMAGECOUNT value on done: 8696.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:50,538][63734] Sum rewards: 0.263, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.722', 'AMMO5': '0.015', 'AMMO2': '0.022', 'ARMOR': '0.032', 'WEAPON1': '0.040', 'AMMO4': '0.107', 'AMMO3': '0.136', 'weapon5': '0.306', 'HITCOUNT': '0.320', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'weapon2': '1.280', 'DAMAGECOUNT': '1.365', 'weapon3': '1.912', 'FRAGCOUNT': '3.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:51,846][63732] Updated weights for policy 0, policy_version 1880 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:52,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11264.0, 300 sec: 11357.7). Total num frames: 14970880. Throughput: 0: 1407.7, 1: 1405.5. Samples: 3736957. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:52,460][109198] Avg episode reward: [(0, '-1.188'), (1, '-3.063')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:52,462][63454] Saving new best policy, reward=-1.188!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:54,428][63767] DAMAGECOUNT value on done: 12722.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:54,429][63767] Sum rewards: -2.973, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.286', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.023', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'AMMO4': '0.116', 'weapon4': '0.150', 'AMMO3': '0.154', 'WEAPON5': '0.200', 'HITCOUNT': '0.310', 'weapon5': '0.398', 'WEAPON3': '0.850', 'weapon2': '1.040', 'DAMAGECOUNT': '1.407', 'FRAGCOUNT': '2.000', 'weapon3': '2.062'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:54,813][63767] DAMAGECOUNT value on done: 14453.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:54,814][63767] Sum rewards: -1.866, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.346', 'AMMO2': '0.002', 'AMMO4': '0.010', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'ARMOR': '0.129', 'AMMO3': '0.131', 'weapon4': '0.166', 'WEAPON5': '0.200', 'weapon5': '0.312', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.800', 'weapon2': '1.106', 'FRAGCOUNT': '1.500', 'weapon3': '1.928'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:55,482][63771] DAMAGECOUNT value on done: 9530.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:55,482][63771] Sum rewards: -0.622, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.892', 'AMMO4': '-0.041', 'AMMO2': '-0.008', 'AMMO5': '0.015', 'ARMOR': '0.044', 'HITCOUNT': '0.090', 'AMMO3': '0.112', 'weapon7': '0.142', 'weapon5': '0.168', 'WEAPON5': '0.200', 'AMMO6': '0.220', 'AMMO7': '0.220', 'WEAPON7': '0.300', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.376', 'weapon3': '1.412'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:55,846][63771] DAMAGECOUNT value on done: 11971.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:55,847][63771] Sum rewards: -6.492, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-3.000', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'AMMO5': '0.007', 'WEAPON1': '0.030', 'weapon5': '0.088', 'WEAPON4': '0.100', 'weapon4': '0.120', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'AMMO3': '0.215', 'DAMAGECOUNT': '0.447', 'ARMOR': '0.457', 'WEAPON3': '1.000', 'weapon2': '1.508', 'weapon3': '1.996', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:55,857][63735] DAMAGECOUNT value on done: 9866.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:55,899][63733] Updated weights for policy 1, policy_version 1780 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:56,262][63735] DAMAGECOUNT value on done: 12303.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:56,263][63735] Sum rewards: -1.032, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.669', 'AMMO5': '0.007', 'AMMO2': '0.018', 'ARMOR': '0.048', 'WEAPON4': '0.050', 'AMMO4': '0.091', 'weapon4': '0.112', 'weapon5': '0.114', 'AMMO3': '0.138', 'WEAPON5': '0.150', 'HITCOUNT': '0.330', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.692', 'weapon2': '1.748', 'weapon3': '1.788', 'FRAGCOUNT': '2.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:56,373][63806] DAMAGECOUNT value on done: 9487.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:56,373][63806] Sum rewards: 1.829, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.520', 'AMMO2': '0.008', 'AMMO5': '0.018', 'WEAPON1': '0.030', 'AMMO4': '0.041', 'ARMOR': '0.062', 'weapon4': '0.072', 'AMMO3': '0.109', 'WEAPON4': '0.200', 'weapon5': '0.248', 'WEAPON5': '0.350', 'HITCOUNT': '0.360', 'WEAPON3': '0.850', 'weapon2': '1.274', 'DAMAGECOUNT': '1.821', 'weapon3': '1.906', 'FRAGCOUNT': '3.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:56,482][63770] DAMAGECOUNT value on done: 12050.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:56,482][63770] Sum rewards: -0.791, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.860', 'AMMO2': '0.005', 'AMMO5': '0.019', 'WEAPON1': '0.020', 'AMMO4': '0.027', 'ARMOR': '0.056', 'AMMO3': '0.120', 'weapon4': '0.190', 'WEAPON4': '0.200', 'weapon5': '0.266', 'WEAPON5': '0.300', 'HITCOUNT': '0.300', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon2': '1.280', 'weapon3': '1.586'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:56,709][63806] DAMAGECOUNT value on done: 10425.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:56,929][63770] DAMAGECOUNT value on done: 8879.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:56,930][63770] Sum rewards: -3.220, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.711', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'AMMO4': '0.055', 'ARMOR': '0.064', 'AMMO3': '0.152', 'weapon4': '0.160', 'WEAPON4': '0.200', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.840', 'WEAPON3': '0.900', 'weapon2': '1.182', 'weapon3': '1.706', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:57,406][63735] DAMAGECOUNT value on done: 11011.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:57,406][63735] Sum rewards: -0.056, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.143', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'AMMO5': '0.015', 'ARMOR': '0.028', 'WEAPON4': '0.100', 'weapon5': '0.110', 'AMMO3': '0.126', 'weapon4': '0.200', 'WEAPON5': '0.250', 'HITCOUNT': '0.320', 'weapon2': '0.832', 'WEAPON3': '1.050', 'DAMAGECOUNT': '1.629', 'weapon3': '2.440', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:57,430][63806] DAMAGECOUNT value on done: 10318.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:57,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11264.0, 300 sec: 11357.7). Total num frames: 15028224. Throughput: 0: 1408.7, 1: 1407.9. Samples: 3754065. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:58:57,459][109198] Avg episode reward: [(0, '-1.279'), (1, '-3.033')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:57,763][63806] DAMAGECOUNT value on done: 10165.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:57,763][63806] Sum rewards: -4.453, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.546', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.032', 'AMMO2': '-0.006', 'weapon5': '0.006', 'WEAPON1': '0.010', 'AMMO5': '0.014', 'ARMOR': '0.040', 'AMMO3': '0.112', 'HITCOUNT': '0.180', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.720', 'WEAPON3': '0.750', 'weapon3': '1.430', 'weapon2': '1.668'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:57,791][63735] DAMAGECOUNT value on done: 8508.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:57,792][63735] Sum rewards: -3.598, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.036', 'AMMO5': '0.003', 'AMMO2': '0.012', 'weapon5': '0.012', 'WEAPON1': '0.020', 'WEAPON5': '0.050', 'AMMO4': '0.058', 'AMMO3': '0.074', 'ARMOR': '0.108', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'weapon4': '0.174', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.450', 'FRAGCOUNT': '1.000', 'weapon3': '1.300', 'weapon2': '1.738'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:58:59,031][63732] Updated weights for policy 0, policy_version 1890 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:00,008][63805] DAMAGECOUNT value on done: 11815.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:00,008][63805] Sum rewards: 2.489, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.042', 'AMMO2': '0.005', 'weapon7': '0.012', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.025', 'ARMOR': '0.076', 'AMMO3': '0.082', 'weapon4': '0.082', 'WEAPON4': '0.100', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon5': '0.212', 'HITCOUNT': '0.240', 'WEAPON5': '0.250', 'WEAPON3': '0.600', 'weapon3': '1.416', 'DAMAGECOUNT': '1.428', 'weapon2': '1.620', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:00,341][63805] DAMAGECOUNT value on done: 13087.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:00,341][63805] Sum rewards: 0.080, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.336', 'AMMO2': '0.007', 'AMMO5': '0.023', 'AMMO4': '0.036', 'WEAPON4': '0.050', 'ARMOR': '0.096', 'AMMO3': '0.168', 'weapon4': '0.194', 'HITCOUNT': '0.200', 'weapon5': '0.270', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.756', 'WEAPON3': '0.850', 'weapon2': '1.008', 'weapon3': '2.158', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:01,095][63771] DAMAGECOUNT value on done: 11342.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:01,096][63771] Sum rewards: -2.602, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.776', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.002', 'AMMO5': '0.007', 'AMMO4': '0.011', 'WEAPON1': '0.030', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'weapon5': '0.054', 'weapon4': '0.082', 'AMMO3': '0.111', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.500', 'weapon3': '1.506', 'weapon2': '1.530'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:01,441][63771] DAMAGECOUNT value on done: 8417.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:02,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11264.0, 300 sec: 11357.7). Total num frames: 15085568. Throughput: 0: 1407.0, 1: 1407.8. Samples: 3762565. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:02,460][109198] Avg episode reward: [(0, '-1.176'), (1, '-3.081')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:02,461][63454] Saving new best policy, reward=-1.176!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:03,124][63733] Updated weights for policy 1, policy_version 1790 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:05,229][63769] DAMAGECOUNT value on done: 11064.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:05,230][63769] Sum rewards: -4.439, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.656', 'AMMO2': '0.001', 'AMMO4': '0.006', 'AMMO5': '0.028', 'WEAPON1': '0.030', 'ARMOR': '0.056', 'AMMO3': '0.149', 'HITCOUNT': '0.150', 'DAMAGECOUNT': '0.465', 'weapon5': '0.496', 'WEAPON5': '0.650', 'WEAPON3': '0.950', 'weapon2': '1.204', 'weapon3': '1.782', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:05,679][63769] DAMAGECOUNT value on done: 8066.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:05,679][63769] Sum rewards: -5.789, reward structure: {'DEATHCOUNT': '-12.000', 'weapon5': '0.002', 'AMMO5': '0.003', 'AMMO2': '0.009', 'ARMOR': '0.020', 'AMMO4': '0.045', 'WEAPON5': '0.050', 'HITCOUNT': '0.130', 'AMMO3': '0.166', 'HEALTH': '0.358', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.372', 'weapon3': '1.886'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:06,187][63732] Updated weights for policy 0, policy_version 1900 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:07,458][109198] Fps is (10 sec: 11058.9, 60 sec: 11195.7, 300 sec: 11329.9). Total num frames: 15138816. Throughput: 0: 1409.6, 1: 1407.0. Samples: 3779565. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:07,460][109198] Avg episode reward: [(0, '-1.193'), (1, '-3.084')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:07,993][63767] DAMAGECOUNT value on done: 12545.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:07,993][63767] Sum rewards: 0.904, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.700', 'AMMO2': '0.012', 'AMMO5': '0.020', 'WEAPON1': '0.020', 'ARMOR': '0.052', 'AMMO4': '0.061', 'weapon4': '0.092', 'AMMO3': '0.162', 'weapon5': '0.190', 'WEAPON4': '0.200', 'WEAPON5': '0.350', 'HITCOUNT': '0.440', 'WEAPON3': '0.850', 'weapon2': '1.336', 'DAMAGECOUNT': '1.635', 'weapon3': '1.934', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:08,307][63770] DAMAGECOUNT value on done: 9372.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:08,339][63767] DAMAGECOUNT value on done: 11995.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:08,339][63767] Sum rewards: 0.335, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.328', 'weapon7': '0.002', 'AMMO2': '0.009', 'AMMO5': '0.023', 'AMMO4': '0.043', 'WEAPON4': '0.100', 'AMMO3': '0.113', 'HITCOUNT': '0.130', 'weapon4': '0.186', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon5': '0.322', 'WEAPON5': '0.450', 'ARMOR': '0.502', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.936', 'weapon3': '1.170', 'weapon2': '1.678', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:08,697][63770] DAMAGECOUNT value on done: 10379.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:08,697][63770] Sum rewards: 3.667, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.056', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'weapon7': '0.014', 'AMMO5': '0.017', 'ARMOR': '0.036', 'WEAPON1': '0.040', 'weapon5': '0.086', 'weapon4': '0.098', 'WEAPON4': '0.100', 'AMMO3': '0.137', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.250', 'HITCOUNT': '0.360', 'WEAPON3': '0.800', 'weapon2': '1.324', 'DAMAGECOUNT': '1.797', 'weapon3': '2.094', 'FRAGCOUNT': '6.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:09,568][63734] DAMAGECOUNT value on done: 10822.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:09,568][63734] Sum rewards: -2.138, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.584', 'AMMO5': '0.005', 'weapon5': '0.008', 'AMMO2': '0.012', 'weapon4': '0.014', 'AMMO4': '0.059', 'ARMOR': '0.060', 'weapon7': '0.066', 'AMMO3': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.140', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON7': '0.200', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.690', 'weapon2': '1.338', 'weapon3': '1.634', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:09,949][63734] DAMAGECOUNT value on done: 10814.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:09,950][63734] Sum rewards: -0.485, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.391', 'AMMO2': '0.007', 'weapon4': '0.020', 'AMMO4': '0.032', 'weapon7': '0.092', 'WEAPON4': '0.100', 'ARMOR': '0.110', 'AMMO3': '0.116', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON7': '0.200', 'HITCOUNT': '0.210', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.161', 'weapon2': '1.414', 'weapon3': '1.804', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:10,070][63805] DAMAGECOUNT value on done: 11827.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:10,070][63805] Sum rewards: -4.719, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.629', 'AMMO2': '0.004', 'AMMO5': '0.005', 'ARMOR': '0.016', 'AMMO4': '0.019', 'WEAPON4': '0.100', 'HITCOUNT': '0.130', 'AMMO3': '0.156', 'DAMAGECOUNT': '0.372', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.534', 'weapon3': '1.724'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:10,387][63733] Updated weights for policy 1, policy_version 1800 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:10,446][63805] DAMAGECOUNT value on done: 9243.0\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:12,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11264.0, 300 sec: 11343.8). Total num frames: 15196160. Throughput: 0: 1412.8, 1: 1408.2. Samples: 3796627. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:12,460][109198] Avg episode reward: [(0, '-1.097'), (1, '-3.151')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:12,461][63454] Saving new best policy, reward=-1.097!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:13,066][63734] DAMAGECOUNT value on done: 10811.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:13,066][63734] Sum rewards: -0.674, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.850', 'AMMO2': '0.005', 'AMMO5': '0.005', 'AMMO4': '0.023', 'weapon7': '0.062', 'weapon5': '0.066', 'AMMO3': '0.076', 'WEAPON5': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.290', 'weapon4': '0.408', 'WEAPON3': '0.450', 'ARMOR': '0.525', 'weapon2': '0.758', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.176', 'weapon3': '1.342'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:13,110][63769] DAMAGECOUNT value on done: 10935.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:13,110][63769] Sum rewards: 0.167, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.007', 'AMMO2': '0.017', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'HITCOUNT': '0.080', 'AMMO4': '0.085', 'AMMO3': '0.088', 'WEAPON5': '0.100', 'weapon4': '0.186', 'DAMAGECOUNT': '0.255', 'WEAPON3': '0.450', 'HEALTH': '0.810', 'FRAGCOUNT': '1.000', 'weapon3': '1.216', 'weapon2': '1.782'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:13,405][63732] Updated weights for policy 0, policy_version 1910 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:13,436][63734] DAMAGECOUNT value on done: 8970.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:13,436][63734] Sum rewards: 2.195, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.304', 'AMMO2': '0.008', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.038', 'ARMOR': '0.076', 'weapon5': '0.096', 'AMMO3': '0.103', 'HITCOUNT': '0.210', 'WEAPON5': '0.250', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.822', 'weapon2': '1.330', 'FRAGCOUNT': '2.000', 'weapon3': '2.244'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:13,481][63769] DAMAGECOUNT value on done: 10103.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:16,722][63767] DAMAGECOUNT value on done: 13106.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:16,723][63767] Sum rewards: -4.449, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-2.000', 'HEALTH': '-0.353', 'AMMO2': '0.005', 'AMMO5': '0.010', 'AMMO4': '0.024', 'ARMOR': '0.060', 'AMMO3': '0.145', 'WEAPON5': '0.150', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon5': '0.298', 'HITCOUNT': '0.350', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.152', 'weapon2': '1.288', 'weapon3': '2.122'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:17,085][63767] DAMAGECOUNT value on done: 14795.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:17,086][63767] Sum rewards: 0.318, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.473', 'AMMO5': '0.012', 'AMMO2': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.040', 'AMMO4': '0.070', 'AMMO3': '0.090', 'weapon5': '0.132', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'HITCOUNT': '0.200', 'weapon4': '0.202', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.026', 'weapon2': '1.326', 'weapon3': '1.708'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:17,458][109198] Fps is (10 sec: 11469.1, 60 sec: 11195.7, 300 sec: 11343.8). Total num frames: 15253504. Throughput: 0: 1413.7, 1: 1407.9. Samples: 3805127. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:17,460][109198] Avg episode reward: [(0, '-1.016'), (1, '-3.104')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:17,467][63454] Saving new best policy, reward=-1.016!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:17,600][63733] Updated weights for policy 1, policy_version 1810 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:18,511][63771] DAMAGECOUNT value on done: 9784.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:18,511][63771] Sum rewards: -0.413, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.520', 'AMMO4': '-0.013', 'AMMO2': '-0.002', 'AMMO5': '0.017', 'weapon5': '0.022', 'AMMO3': '0.133', 'HITCOUNT': '0.250', 'WEAPON5': '0.250', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.762', 'weapon2': '1.428', 'weapon3': '2.010', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:18,842][63771] DAMAGECOUNT value on done: 12140.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:18,842][63771] Sum rewards: -3.891, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.472', 'AMMO5': '0.020', 'AMMO2': '0.024', 'weapon5': '0.036', 'ARMOR': '0.076', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO4': '0.117', 'AMMO3': '0.125', 'weapon7': '0.134', 'HITCOUNT': '0.180', 'WEAPON4': '0.200', 'weapon4': '0.212', 'WEAPON5': '0.300', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.507', 'weapon2': '1.244', 'weapon3': '1.606'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:19,785][63735] Large shaping reward -2.504 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.255, -85.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:19,886][63806] DAMAGECOUNT value on done: 10547.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:19,887][63806] Sum rewards: -0.702, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.266', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'weapon5': '0.010', 'AMMO5': '0.015', 'ARMOR': '0.036', 'AMMO3': '0.102', 'HITCOUNT': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.687', 'FRAGCOUNT': '1.000', 'weapon2': '1.084', 'weapon3': '1.910'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:20,199][63806] DAMAGECOUNT value on done: 10230.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:20,496][63732] Updated weights for policy 0, policy_version 1920 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:20,802][63806] DAMAGECOUNT value on done: 10036.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:20,802][63806] Sum rewards: -2.265, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.274', 'weapon5': '0.002', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'WEAPON5': '0.050', 'ARMOR': '0.052', 'AMMO4': '0.087', 'WEAPON4': '0.100', 'AMMO3': '0.183', 'weapon4': '0.210', 'HITCOUNT': '0.480', 'WEAPON3': '0.900', 'weapon2': '1.536', 'DAMAGECOUNT': '1.647', 'weapon3': '1.732', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:20,805][63735] DAMAGECOUNT value on done: 10175.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:20,806][63735] Sum rewards: -6.058, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.470', 'AMMO4': '-0.058', 'AMMO2': '-0.012', 'AMMO5': '0.010', 'weapon5': '0.010', 'WEAPON1': '0.020', 'AMMO3': '0.117', 'HITCOUNT': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.927', 'weapon3': '1.670', 'weapon2': '1.778', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:21,239][63806] DAMAGECOUNT value on done: 10600.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:21,240][63806] Sum rewards: -1.699, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.246', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'AMMO5': '0.015', 'ARMOR': '0.032', 'weapon5': '0.060', 'AMMO3': '0.142', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.525', 'WEAPON3': '0.800', 'weapon2': '1.180', 'weapon3': '1.964', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:21,249][63735] DAMAGECOUNT value on done: 12458.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:21,249][63735] Sum rewards: -8.204, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-3.000', 'HEALTH': '-2.086', 'AMMO4': '-0.037', 'AMMO2': '-0.007', 'AMMO5': '0.021', 'WEAPON1': '0.030', 'ARMOR': '0.052', 'weapon5': '0.134', 'HITCOUNT': '0.140', 'AMMO3': '0.164', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.950', 'weapon2': '1.782', 'weapon3': '1.788'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:22,092][63770] DAMAGECOUNT value on done: 12755.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:22,092][63770] Sum rewards: 2.836, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.506', 'AMMO5': '0.013', 'AMMO2': '0.019', 'WEAPON4': '0.050', 'AMMO4': '0.096', 'AMMO3': '0.137', 'weapon4': '0.140', 'WEAPON5': '0.200', 'HITCOUNT': '0.290', 'weapon5': '0.350', 'ARMOR': '0.575', 'WEAPON3': '0.700', 'weapon3': '1.418', 'weapon2': '1.988', 'DAMAGECOUNT': '2.115', 'FRAGCOUNT': '3.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:22,328][63735] DAMAGECOUNT value on done: 11465.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:22,328][63735] Sum rewards: -0.634, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.324', 'AMMO2': '0.005', 'AMMO5': '0.008', 'weapon4': '0.016', 'AMMO4': '0.025', 'weapon5': '0.054', 'WEAPON4': '0.100', 'AMMO3': '0.129', 'WEAPON5': '0.150', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.350', 'ARMOR': '0.507', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.362', 'weapon2': '1.666', 'weapon3': '1.918', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:22,429][63770] DAMAGECOUNT value on done: 8949.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:22,430][63770] Sum rewards: -1.526, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO5': '0.005', 'AMMO2': '0.011', 'WEAPON5': '0.050', 'AMMO4': '0.055', 'HITCOUNT': '0.060', 'AMMO3': '0.092', 'HEALTH': '0.140', 'DAMAGECOUNT': '0.210', 'WEAPON3': '0.450', 'FRAGCOUNT': '1.000', 'weapon3': '1.566', 'weapon2': '1.584'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:22,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11264.0, 300 sec: 11343.8). Total num frames: 15310848. Throughput: 0: 1420.0, 1: 1413.3. Samples: 3822467. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:22,460][109198] Avg episode reward: [(0, '-1.047'), (1, '-3.001')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:22,732][63735] DAMAGECOUNT value on done: 8583.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:22,897][63805] DAMAGECOUNT value on done: 12110.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:22,898][63805] Sum rewards: -0.125, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.122', 'AMMO2': '0.011', 'AMMO5': '0.017', 'AMMO4': '0.053', 'AMMO3': '0.102', 'weapon5': '0.204', 'HITCOUNT': '0.240', 'WEAPON5': '0.250', 'ARMOR': '0.494', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.885', 'weapon2': '1.558', 'weapon3': '1.782'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:23,235][63805] DAMAGECOUNT value on done: 13314.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:23,236][63805] Sum rewards: -0.561, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.307', 'AMMO2': '0.014', 'AMMO5': '0.016', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'AMMO4': '0.070', 'AMMO3': '0.078', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon5': '0.184', 'weapon7': '0.196', 'HITCOUNT': '0.200', 'WEAPON5': '0.300', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.681', 'FRAGCOUNT': '1.000', 'weapon3': '1.082', 'weapon2': '2.030'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:23,916][63771] DAMAGECOUNT value on done: 11452.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:23,916][63771] Sum rewards: -1.413, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.800', 'WEAPON1': '0.010', 'AMMO2': '0.028', 'HITCOUNT': '0.070', 'ARMOR': '0.080', 'AMMO3': '0.105', 'AMMO4': '0.138', 'WEAPON4': '0.250', 'weapon4': '0.268', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.088', 'weapon2': '1.420'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:24,309][63771] DAMAGECOUNT value on done: 8557.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:24,693][63733] Updated weights for policy 1, policy_version 1820 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:26,241][63769] Large shaping reward 2.632 for [('FRAGCOUNT', 2.0, 2.0), ('HITCOUNT', 0.03, 3.0), ('DAMAGECOUNT', 0.6, 200), ('weapon7', 0.002)]\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:27,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11264.0, 300 sec: 11343.8). Total num frames: 15368192. Throughput: 0: 1426.9, 1: 1423.1. Samples: 3839838. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:27,459][109198] Avg episode reward: [(0, '-1.084'), (1, '-3.001')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:27,487][63732] Updated weights for policy 0, policy_version 1930 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:29,933][63769] DAMAGECOUNT value on done: 11485.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:29,933][63769] Sum rewards: -2.360, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.344', 'AMMO2': '0.007', 'ARMOR': '0.024', 'AMMO5': '0.025', 'AMMO4': '0.033', 'weapon7': '0.074', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.140', 'AMMO3': '0.164', 'weapon5': '0.188', 'WEAPON7': '0.200', 'WEAPON5': '0.450', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.263', 'weapon2': '1.360', 'weapon3': '1.916', 'FRAGCOUNT': '2.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:30,348][63769] DAMAGECOUNT value on done: 8136.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:30,349][63769] Sum rewards: -4.752, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.090', 'AMMO2': '0.012', 'ARMOR': '0.040', 'HITCOUNT': '0.060', 'AMMO4': '0.061', 'WEAPON4': '0.100', 'AMMO3': '0.107', 'DAMAGECOUNT': '0.210', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.558', 'weapon2': '1.640'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:30,406][63767] DAMAGECOUNT value on done: 12708.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:30,406][63767] Sum rewards: 0.455, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.434', 'AMMO5': '0.015', 'AMMO2': '0.029', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'ARMOR': '0.053', 'weapon7': '0.078', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon5': '0.108', 'AMMO3': '0.122', 'AMMO4': '0.143', 'HITCOUNT': '0.160', 'weapon4': '0.188', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.489', 'WEAPON3': '0.700', 'weapon2': '0.734', 'weapon3': '1.990', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:30,730][63767] DAMAGECOUNT value on done: 12075.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:31,551][63733] Updated weights for policy 1, policy_version 1830 (0.0009)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:32,458][109198] Fps is (10 sec: 11878.4, 60 sec: 11400.5, 300 sec: 11343.8). Total num frames: 15429632. Throughput: 0: 1429.3, 1: 1426.1. Samples: 3848559. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:32,460][109198] Avg episode reward: [(0, '-1.147'), (1, '-3.028')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:32,465][63734] DAMAGECOUNT value on done: 10857.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:32,466][63734] Sum rewards: -4.303, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.820', 'AMMO4': '-0.008', 'AMMO2': '-0.002', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'weapon5': '0.032', 'HITCOUNT': '0.040', 'DAMAGECOUNT': '0.105', 'AMMO3': '0.179', 'WEAPON5': '0.200', 'WEAPON3': '0.850', 'weapon2': '1.474', 'weapon3': '1.614', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:32,727][63805] DAMAGECOUNT value on done: 12096.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:32,727][63805] Sum rewards: -1.249, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.476', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.025', 'weapon5': '0.026', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'AMMO4': '0.127', 'AMMO3': '0.137', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'weapon4': '0.244', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.807', 'weapon2': '1.414', 'weapon3': '1.424', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:32,799][63734] DAMAGECOUNT value on done: 10999.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:32,799][63734] Sum rewards: -2.584, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.376', 'AMMO4': '-0.039', 'AMMO2': '-0.008', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'weapon5': '0.038', 'ARMOR': '0.048', 'AMMO3': '0.118', 'HITCOUNT': '0.150', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.555', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.452', 'weapon3': '1.892'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:33,101][63770] DAMAGECOUNT value on done: 9532.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:33,102][63770] Sum rewards: -2.753, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.675', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.013', 'weapon4': '0.032', 'ARMOR': '0.040', 'AMMO4': '0.067', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.131', 'HITCOUNT': '0.150', 'DAMAGECOUNT': '0.480', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.224', 'weapon3': '2.020'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:33,166][63805] DAMAGECOUNT value on done: 9448.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:33,167][63805] Sum rewards: -2.281, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.959', 'AMMO4': '-0.039', 'AMMO2': '-0.008', 'AMMO5': '0.010', 'weapon5': '0.022', 'ARMOR': '0.024', 'WEAPON5': '0.100', 'AMMO3': '0.146', 'HITCOUNT': '0.150', 'DAMAGECOUNT': '0.615', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.408', 'weapon2': '1.950'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:33,461][63770] DAMAGECOUNT value on done: 10909.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:33,461][63770] Sum rewards: -1.008, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.895', 'AMMO4': '-0.033', 'AMMO2': '-0.007', 'AMMO5': '0.031', 'weapon4': '0.054', 'weapon7': '0.056', 'WEAPON4': '0.100', 'AMMO3': '0.124', 'weapon5': '0.164', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.360', 'WEAPON5': '0.500', 'WEAPON3': '0.850', 'weapon2': '1.242', 'DAMAGECOUNT': '1.590', 'weapon3': '2.006', 'FRAGCOUNT': '2.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:35,220][63732] Updated weights for policy 0, policy_version 1940 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:35,967][63734] DAMAGECOUNT value on done: 11371.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:35,968][63734] Sum rewards: 2.295, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.924', 'AMMO4': '-0.006', 'AMMO2': '-0.001', 'AMMO5': '0.010', 'ARMOR': '0.032', 'weapon5': '0.156', 'AMMO3': '0.214', 'WEAPON5': '0.250', 'HITCOUNT': '0.390', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.680', 'weapon2': '1.820', 'weapon3': '1.824', 'FRAGCOUNT': '6.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:36,263][63769] DAMAGECOUNT value on done: 11255.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:36,263][63769] Sum rewards: -4.545, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.577', 'AMMO4': '-0.027', 'AMMO2': '-0.005', 'AMMO5': '0.005', 'weapon5': '0.006', 'WEAPON1': '0.020', 'WEAPON5': '0.100', 'AMMO3': '0.149', 'HITCOUNT': '0.250', 'WEAPON3': '0.950', 'DAMAGECOUNT': '0.960', 'FRAGCOUNT': '1.000', 'weapon2': '1.324', 'weapon3': '2.050'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:36,352][63734] DAMAGECOUNT value on done: 9189.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:36,352][63734] Sum rewards: -0.589, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.825', 'AMMO4': '-0.023', 'AMMO2': '-0.005', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'weapon5': '0.030', 'ARMOR': '0.048', 'weapon7': '0.066', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.157', 'HITCOUNT': '0.180', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.657', 'WEAPON3': '0.700', 'weapon2': '1.480', 'weapon3': '1.916', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:36,600][63769] DAMAGECOUNT value on done: 10500.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:36,601][63769] Sum rewards: 0.290, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.110', 'AMMO2': '0.022', 'weapon4': '0.028', 'WEAPON4': '0.050', 'weapon7': '0.092', 'AMMO3': '0.096', 'AMMO4': '0.108', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.200', 'WEAPON7': '0.200', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.170', 'weapon2': '1.302', 'weapon3': '1.492', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:37,458][109198] Fps is (10 sec: 11878.4, 60 sec: 11400.5, 300 sec: 11357.7). Total num frames: 15486976. Throughput: 0: 1411.0, 1: 1450.6. Samples: 3865727. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:37,460][109198] Avg episode reward: [(0, '-1.063'), (1, '-2.950')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:38,063][63733] Updated weights for policy 1, policy_version 1840 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:39,395][63767] DAMAGECOUNT value on done: 13386.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:39,396][63767] Sum rewards: -3.215, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.126', 'AMMO2': '0.001', 'AMMO4': '0.003', 'WEAPON1': '0.010', 'AMMO5': '0.025', 'ARMOR': '0.028', 'weapon5': '0.094', 'AMMO3': '0.178', 'HITCOUNT': '0.230', 'WEAPON5': '0.500', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.840', 'weapon2': '1.188', 'FRAGCOUNT': '2.000', 'weapon3': '2.264'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:39,733][63767] DAMAGECOUNT value on done: 15427.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:39,733][63767] Sum rewards: 3.520, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.560', 'AMMO5': '0.007', 'AMMO2': '0.009', 'WEAPON1': '0.010', 'ARMOR': '0.024', 'AMMO4': '0.046', 'weapon7': '0.048', 'AMMO3': '0.107', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon5': '0.194', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.340', 'WEAPON3': '0.650', 'weapon3': '1.664', 'weapon2': '1.694', 'DAMAGECOUNT': '1.896', 'FRAGCOUNT': '3.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:41,294][63771] DAMAGECOUNT value on done: 10017.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:41,295][63771] Sum rewards: 1.262, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.242', 'WEAPON1': '0.010', 'AMMO5': '0.014', 'AMMO2': '0.019', 'ARMOR': '0.024', 'WEAPON4': '0.050', 'AMMO4': '0.096', 'AMMO3': '0.109', 'weapon4': '0.200', 'HITCOUNT': '0.220', 'WEAPON5': '0.300', 'weapon5': '0.334', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.699', 'weapon2': '0.910', 'weapon3': '1.668', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:41,647][63771] DAMAGECOUNT value on done: 12650.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:41,647][63771] Sum rewards: -1.335, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-0.236', 'weapon7': '0.002', 'ARMOR': '0.004', 'AMMO2': '0.004', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO4': '0.020', 'weapon5': '0.032', 'WEAPON5': '0.100', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'AMMO3': '0.205', 'HITCOUNT': '0.430', 'weapon2': '0.976', 'WEAPON3': '1.100', 'DAMAGECOUNT': '1.530', 'weapon3': '2.632', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:42,356][63806] DAMAGECOUNT value on done: 10647.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:42,356][63806] Sum rewards: -8.655, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-3.052', 'AMMO5': '0.007', 'weapon5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'ARMOR': '0.032', 'AMMO4': '0.055', 'HITCOUNT': '0.080', 'AMMO3': '0.109', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.436', 'weapon3': '1.696'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:42,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11400.5, 300 sec: 11343.8). Total num frames: 15544320. Throughput: 0: 1376.1, 1: 1484.0. Samples: 3882766. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:42,460][109198] Avg episode reward: [(0, '-0.894'), (1, '-3.009')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:42,461][63454] Saving new best policy, reward=-0.894!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:42,691][63806] DAMAGECOUNT value on done: 10492.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:42,691][63806] Sum rewards: 0.730, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.820', 'AMMO5': '0.007', 'AMMO2': '0.010', 'weapon5': '0.038', 'AMMO3': '0.045', 'weapon4': '0.046', 'AMMO4': '0.047', 'ARMOR': '0.068', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'HITCOUNT': '0.210', 'WEAPON3': '0.350', 'DAMAGECOUNT': '0.786', 'weapon3': '1.210', 'weapon2': '1.732', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:43,979][63732] Updated weights for policy 0, policy_version 1950 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:43,984][63733] Updated weights for policy 1, policy_version 1850 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:44,723][63806] DAMAGECOUNT value on done: 10264.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:44,724][63806] Sum rewards: -3.826, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.860', 'AMMO2': '0.006', 'AMMO5': '0.015', 'AMMO4': '0.030', 'WEAPON1': '0.040', 'AMMO3': '0.149', 'HITCOUNT': '0.150', 'weapon5': '0.178', 'WEAPON5': '0.300', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.684', 'WEAPON3': '0.750', 'weapon3': '1.512', 'weapon2': '1.720'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:44,937][63735] DAMAGECOUNT value on done: 10390.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:44,938][63735] Sum rewards: -2.671, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.836', 'AMMO2': '0.005', 'AMMO5': '0.015', 'weapon5': '0.022', 'ARMOR': '0.024', 'AMMO4': '0.027', 'WEAPON1': '0.080', 'AMMO3': '0.138', 'HITCOUNT': '0.180', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.645', 'WEAPON3': '0.900', 'weapon2': '1.214', 'weapon3': '1.914', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:45,103][63806] DAMAGECOUNT value on done: 10935.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:45,103][63806] Sum rewards: -1.803, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.912', 'AMMO4': '-0.003', 'AMMO2': '-0.001', 'WEAPON1': '0.040', 'ARMOR': '0.072', 'weapon4': '0.078', 'WEAPON4': '0.100', 'AMMO3': '0.108', 'HITCOUNT': '0.270', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.005', 'weapon3': '1.056', 'weapon2': '1.784'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:45,327][63735] DAMAGECOUNT value on done: 13022.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:45,328][63735] Sum rewards: -0.495, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.804', 'weapon4': '0.006', 'AMMO2': '0.017', 'WEAPON1': '0.020', 'AMMO5': '0.020', 'ARMOR': '0.040', 'AMMO4': '0.086', 'WEAPON4': '0.100', 'weapon5': '0.156', 'AMMO3': '0.176', 'HITCOUNT': '0.260', 'WEAPON5': '0.300', 'WEAPON3': '0.900', 'weapon2': '1.350', 'DAMAGECOUNT': '1.692', 'weapon3': '1.936', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:45,646][63805] DAMAGECOUNT value on done: 12551.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:45,647][63805] Sum rewards: 3.179, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.485', 'AMMO2': '0.007', 'AMMO5': '0.012', 'AMMO4': '0.037', 'AMMO3': '0.164', 'weapon5': '0.186', 'WEAPON5': '0.200', 'HITCOUNT': '0.290', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.323', 'weapon2': '1.420', 'weapon3': '1.774', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:46,035][63805] DAMAGECOUNT value on done: 13688.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:46,035][63805] Sum rewards: 2.184, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.836', 'AMMO2': '0.016', 'weapon7': '0.016', 'AMMO5': '0.025', 'weapon5': '0.052', 'AMMO4': '0.077', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.163', 'WEAPON5': '0.300', 'HITCOUNT': '0.320', 'ARMOR': '0.432', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.927', 'weapon2': '1.348', 'weapon3': '2.294', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:46,355][63735] DAMAGECOUNT value on done: 11685.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:46,356][63735] Sum rewards: -3.556, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.155', 'AMMO4': '-0.018', 'AMMO2': '-0.004', 'AMMO5': '0.015', 'ARMOR': '0.028', 'weapon5': '0.094', 'AMMO3': '0.151', 'WEAPON5': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.220', 'DAMAGECOUNT': '0.660', 'WEAPON3': '0.950', 'weapon2': '1.480', 'weapon3': '1.972', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:46,793][63735] DAMAGECOUNT value on done: 8798.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:46,794][63735] Sum rewards: -5.196, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.270', 'ARMOR': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.011', 'weapon5': '0.026', 'AMMO4': '0.052', 'AMMO3': '0.140', 'WEAPON5': '0.150', 'HITCOUNT': '0.220', 'DAMAGECOUNT': '0.645', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.596', 'weapon3': '1.666'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:46,980][63770] DAMAGECOUNT value on done: 13021.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:46,981][63770] Sum rewards: -4.463, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.108', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.011', 'AMMO2': '0.022', 'ARMOR': '0.075', 'AMMO4': '0.109', 'weapon5': '0.124', 'AMMO3': '0.133', 'HITCOUNT': '0.200', 'weapon4': '0.218', 'WEAPON4': '0.250', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.798', 'WEAPON3': '0.900', 'weapon2': '1.154', 'weapon3': '1.850'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:47,226][63771] DAMAGECOUNT value on done: 11492.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:47,415][63770] DAMAGECOUNT value on done: 9164.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:47,415][63770] Sum rewards: -2.812, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.470', 'AMMO2': '0.001', 'AMMO4': '0.002', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'ARMOR': '0.016', 'WEAPON4': '0.050', 'weapon5': '0.050', 'weapon4': '0.118', 'HITCOUNT': '0.130', 'AMMO3': '0.149', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.645', 'WEAPON3': '0.800', 'weapon3': '1.288', 'weapon2': '1.494', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:47,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11332.3, 300 sec: 11330.0). Total num frames: 15597568. Throughput: 0: 1356.6, 1: 1500.7. Samples: 3891140. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:47,460][109198] Avg episode reward: [(0, '-0.870'), (1, '-3.011')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:47,468][63454] Saving new best policy, reward=-0.870!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:47,612][63771] DAMAGECOUNT value on done: 8604.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:50,229][63733] Updated weights for policy 1, policy_version 1860 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:52,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11400.5, 300 sec: 11330.0). Total num frames: 15654912. Throughput: 0: 1318.4, 1: 1533.1. Samples: 3907883. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:52,460][109198] Avg episode reward: [(0, '-0.870'), (1, '-3.025')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:53,006][63732] Updated weights for policy 0, policy_version 1960 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:53,551][63767] DAMAGECOUNT value on done: 12952.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:53,552][63767] Sum rewards: -0.276, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.472', 'AMMO2': '0.005', 'WEAPON1': '0.010', 'AMMO5': '0.017', 'AMMO4': '0.024', 'ARMOR': '0.076', 'AMMO3': '0.098', 'HITCOUNT': '0.200', 'WEAPON5': '0.250', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.732', 'weapon3': '1.562', 'weapon2': '1.572', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:53,895][63767] DAMAGECOUNT value on done: 12399.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:53,896][63767] Sum rewards: -2.514, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.188', 'ARMOR': '0.004', 'AMMO2': '0.008', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'AMMO4': '0.041', 'AMMO3': '0.113', 'WEAPON5': '0.200', 'HITCOUNT': '0.250', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.972', 'weapon3': '1.558', 'weapon2': '1.848', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:55,183][63769] DAMAGECOUNT value on done: 11653.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:55,183][63769] Sum rewards: -4.674, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.057', 'AMMO5': '0.015', 'AMMO2': '0.029', 'ARMOR': '0.057', 'weapon5': '0.074', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'weapon7': '0.126', 'AMMO4': '0.142', 'AMMO3': '0.152', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON7': '0.200', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.504', 'WEAPON3': '1.050', 'weapon2': '1.656', 'weapon3': '1.848', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:55,541][63769] DAMAGECOUNT value on done: 8324.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:55,979][63734] DAMAGECOUNT value on done: 11126.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:55,979][63734] Sum rewards: 1.627, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-1.046', 'weapon4': '0.004', 'AMMO5': '0.005', 'AMMO2': '0.026', 'WEAPON1': '0.040', 'WEAPON4': '0.050', 'AMMO3': '0.065', 'ARMOR': '0.076', 'WEAPON5': '0.100', 'weapon5': '0.100', 'AMMO4': '0.128', 'HITCOUNT': '0.180', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.807', 'weapon2': '1.530', 'weapon3': '1.562', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:56,071][63805] DAMAGECOUNT value on done: 12236.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:56,072][63805] Sum rewards: -1.372, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.050', 'AMMO4': '-0.019', 'AMMO2': '-0.004', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'AMMO3': '0.081', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.550', 'weapon3': '1.316', 'weapon2': '1.858', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:56,343][63733] Updated weights for policy 1, policy_version 1870 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:56,350][63734] DAMAGECOUNT value on done: 11169.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:56,351][63734] Sum rewards: -2.895, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.610', 'AMMO5': '0.005', 'weapon5': '0.006', 'AMMO2': '0.007', 'WEAPON1': '0.020', 'AMMO4': '0.037', 'ARMOR': '0.040', 'WEAPON5': '0.100', 'AMMO3': '0.102', 'HITCOUNT': '0.150', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.600', 'weapon3': '1.412', 'weapon2': '1.726', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:56,442][63805] DAMAGECOUNT value on done: 9751.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:56,442][63805] Sum rewards: -0.807, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.180', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.010', 'ARMOR': '0.012', 'WEAPON5': '0.050', 'AMMO4': '0.050', 'weapon7': '0.086', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.133', 'WEAPON7': '0.200', 'HITCOUNT': '0.240', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.909', 'weapon2': '1.050', 'weapon3': '1.830', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:57,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11400.5, 300 sec: 11330.0). Total num frames: 15712256. Throughput: 0: 1283.1, 1: 1567.1. Samples: 3924888. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 14:59:57,460][109198] Avg episode reward: [(0, '-0.928'), (1, '-3.014')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:58,721][63734] DAMAGECOUNT value on done: 11783.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:58,722][63734] Sum rewards: -1.210, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.680', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.022', 'ARMOR': '0.045', 'weapon5': '0.094', 'AMMO3': '0.146', 'WEAPON5': '0.250', 'HITCOUNT': '0.270', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.236', 'weapon2': '1.470', 'FRAGCOUNT': '2.000', 'weapon3': '2.010'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:58,729][63770] DAMAGECOUNT value on done: 9681.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:59,042][63734] DAMAGECOUNT value on done: 9641.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:59,043][63734] Sum rewards: 3.247, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.264', 'AMMO5': '0.005', 'AMMO2': '0.010', 'weapon4': '0.028', 'AMMO4': '0.049', 'WEAPON4': '0.050', 'weapon5': '0.054', 'ARMOR': '0.072', 'WEAPON5': '0.100', 'AMMO3': '0.113', 'HITCOUNT': '0.330', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.356', 'weapon2': '1.356', 'weapon3': '1.888', 'FRAGCOUNT': '3.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:59,161][63770] DAMAGECOUNT value on done: 11480.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:59,162][63770] Sum rewards: 1.956, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO5': '0.015', 'AMMO2': '0.023', 'HEALTH': '0.034', 'ARMOR': '0.052', 'weapon7': '0.070', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'AMMO4': '0.115', 'AMMO3': '0.118', 'weapon5': '0.136', 'WEAPON5': '0.250', 'weapon4': '0.350', 'HITCOUNT': '0.510', 'weapon2': '0.558', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.713', 'weapon3': '2.112', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:59,896][63769] DAMAGECOUNT value on done: 11496.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 14:59:59,896][63769] Sum rewards: -4.012, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.946', 'AMMO4': '-0.020', 'AMMO2': '-0.004', 'AMMO5': '0.010', 'HITCOUNT': '0.170', 'AMMO3': '0.181', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.723', 'WEAPON3': '1.050', 'weapon2': '1.088', 'FRAGCOUNT': '2.000', 'weapon3': '2.286'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:00,276][63769] DAMAGECOUNT value on done: 10785.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:00,276][63769] Sum rewards: -2.862, reward structure: {'DEATHCOUNT': '-9.750', 'AMMO2': '0.008', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'weapon5': '0.012', 'ARMOR': '0.028', 'AMMO4': '0.037', 'WEAPON4': '0.050', 'weapon4': '0.062', 'AMMO3': '0.144', 'WEAPON5': '0.150', 'HITCOUNT': '0.220', 'HEALTH': '0.260', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.855', 'FRAGCOUNT': '1.000', 'weapon2': '1.148', 'weapon3': '2.144'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:01,836][63732] Updated weights for policy 0, policy_version 1970 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:02,455][63767] DAMAGECOUNT value on done: 13560.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:02,456][63767] Sum rewards: -2.738, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.150', 'AMMO2': '0.009', 'AMMO5': '0.010', 'ARMOR': '0.016', 'WEAPON1': '0.030', 'weapon5': '0.032', 'AMMO4': '0.045', 'WEAPON4': '0.050', 'weapon4': '0.050', 'AMMO3': '0.087', 'HITCOUNT': '0.170', 'WEAPON5': '0.200', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.522', 'FRAGCOUNT': '1.000', 'weapon3': '1.098', 'weapon2': '1.892'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:02,459][63733] Updated weights for policy 1, policy_version 1880 (0.0013)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:02,464][109198] Fps is (10 sec: 11462.7, 60 sec: 11399.5, 300 sec: 11329.8). Total num frames: 15769600. Throughput: 0: 1263.8, 1: 1585.4. Samples: 3933358. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:02,466][109198] Avg episode reward: [(0, '-0.866'), (1, '-3.008')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:02,469][63454] Saving new best policy, reward=-0.866!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:02,779][63767] DAMAGECOUNT value on done: 15627.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:02,780][63767] Sum rewards: -2.656, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.219', 'AMMO5': '0.005', 'AMMO2': '0.010', 'WEAPON1': '0.040', 'AMMO4': '0.049', 'WEAPON5': '0.100', 'ARMOR': '0.120', 'AMMO3': '0.173', 'HITCOUNT': '0.180', 'DAMAGECOUNT': '0.600', 'WEAPON3': '1.000', 'weapon2': '1.630', 'weapon3': '1.656', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:03,751][63771] DAMAGECOUNT value on done: 10331.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:03,751][63771] Sum rewards: -1.694, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.590', 'AMMO2': '0.014', 'AMMO5': '0.015', 'ARMOR': '0.045', 'AMMO4': '0.068', 'AMMO3': '0.134', 'weapon5': '0.196', 'WEAPON5': '0.250', 'HITCOUNT': '0.290', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.942', 'FRAGCOUNT': '1.000', 'weapon2': '1.310', 'weapon3': '2.132'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:04,082][63771] DAMAGECOUNT value on done: 13077.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:04,083][63771] Sum rewards: 1.615, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.558', 'AMMO2': '0.004', 'AMMO5': '0.007', 'weapon5': '0.008', 'AMMO4': '0.020', 'WEAPON5': '0.050', 'ARMOR': '0.068', 'weapon7': '0.094', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.135', 'weapon4': '0.196', 'WEAPON7': '0.200', 'HITCOUNT': '0.380', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.281', 'weapon2': '1.322', 'weapon3': '1.418', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:07,426][63806] DAMAGECOUNT value on done: 10926.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:07,426][63806] Sum rewards: -0.059, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.591', 'weapon5': '0.002', 'AMMO2': '0.008', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'ARMOR': '0.040', 'AMMO4': '0.041', 'AMMO3': '0.083', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'HITCOUNT': '0.280', 'weapon4': '0.490', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.837', 'weapon2': '1.006', 'weapon3': '1.672', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:07,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11468.8, 300 sec: 11330.0). Total num frames: 15826944. Throughput: 0: 1222.9, 1: 1616.4. Samples: 3950237. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:07,460][109198] Avg episode reward: [(0, '-0.845'), (1, '-2.965')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:07,467][63454] Saving new best policy, reward=-0.845!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:07,801][63806] DAMAGECOUNT value on done: 10744.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:07,802][63806] Sum rewards: -0.325, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.230', 'AMMO5': '0.005', 'weapon5': '0.010', 'AMMO2': '0.023', 'weapon4': '0.098', 'WEAPON5': '0.100', 'AMMO3': '0.107', 'AMMO4': '0.114', 'ARMOR': '0.130', 'WEAPON4': '0.150', 'HITCOUNT': '0.220', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.756', 'weapon2': '0.888', 'FRAGCOUNT': '1.000', 'weapon3': '1.654'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:08,198][63805] DAMAGECOUNT value on done: 13111.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:08,198][63805] Sum rewards: -1.322, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.350', 'AMMO2': '0.010', 'AMMO5': '0.015', 'AMMO4': '0.052', 'ARMOR': '0.128', 'AMMO3': '0.153', 'WEAPON5': '0.250', 'HITCOUNT': '0.270', 'weapon5': '0.278', 'WEAPON3': '0.950', 'weapon3': '1.570', 'DAMAGECOUNT': '1.680', 'weapon2': '1.922', 'FRAGCOUNT': '2.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:08,549][63805] DAMAGECOUNT value on done: 14094.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:08,550][63805] Sum rewards: 3.400, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.007', 'AMMO2': '0.010', 'ARMOR': '0.018', 'AMMO4': '0.047', 'WEAPON4': '0.050', 'weapon5': '0.066', 'AMMO3': '0.080', 'weapon7': '0.092', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.194', 'HITCOUNT': '0.220', 'HEALTH': '0.236', 'WEAPON3': '0.500', 'DAMAGECOUNT': '1.218', 'weapon2': '1.258', 'weapon3': '2.004', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:08,634][63733] Updated weights for policy 1, policy_version 1890 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:09,621][63735] DAMAGECOUNT value on done: 10498.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:09,621][63735] Sum rewards: -0.458, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.007', 'weapon5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.019', 'AMMO3': '0.067', 'AMMO4': '0.095', 'HITCOUNT': '0.120', 'WEAPON5': '0.150', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.324', 'HEALTH': '0.487', 'FRAGCOUNT': '1.000', 'weapon3': '1.120', 'weapon2': '1.832'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:09,859][63806] DAMAGECOUNT value on done: 10729.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:09,859][63806] Sum rewards: -3.922, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.277', 'AMMO4': '-0.008', 'AMMO2': '-0.001', 'AMMO5': '0.013', 'weapon5': '0.030', 'ARMOR': '0.060', 'WEAPON5': '0.150', 'AMMO3': '0.195', 'HITCOUNT': '0.380', 'WEAPON3': '1.100', 'weapon2': '1.310', 'DAMAGECOUNT': '1.395', 'weapon3': '2.482', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:10,003][63735] DAMAGECOUNT value on done: 13310.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:10,004][63735] Sum rewards: -0.366, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO5': '0.005', 'ARMOR': '0.008', 'AMMO2': '0.010', 'WEAPON4': '0.050', 'AMMO4': '0.051', 'WEAPON5': '0.100', 'weapon4': '0.100', 'AMMO3': '0.120', 'weapon5': '0.122', 'HITCOUNT': '0.240', 'HEALTH': '0.284', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.864', 'weapon2': '1.458', 'FRAGCOUNT': '2.000', 'weapon3': '2.022'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:10,279][63806] DAMAGECOUNT value on done: 11185.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:10,279][63806] Sum rewards: -1.372, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.014', 'AMMO4': '-0.000', 'AMMO2': '0.000', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'weapon4': '0.044', 'ARMOR': '0.048', 'WEAPON4': '0.050', 'AMMO3': '0.138', 'WEAPON5': '0.150', 'HITCOUNT': '0.240', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.750', 'weapon2': '1.276', 'weapon3': '1.718', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:10,279][63771] DAMAGECOUNT value on done: 11507.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:10,608][63771] DAMAGECOUNT value on done: 8994.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:10,609][63771] Sum rewards: -2.482, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.242', 'AMMO4': '-0.008', 'AMMO2': '-0.002', 'weapon5': '0.002', 'AMMO5': '0.007', 'ARMOR': '0.040', 'AMMO3': '0.142', 'WEAPON5': '0.150', 'HITCOUNT': '0.280', 'WEAPON3': '0.950', 'DAMAGECOUNT': '1.170', 'weapon2': '1.572', 'weapon3': '1.956', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:11,084][63735] DAMAGECOUNT value on done: 11893.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:11,085][63735] Sum rewards: -2.958, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.180', 'AMMO2': '0.003', 'AMMO5': '0.007', 'AMMO4': '0.012', 'weapon4': '0.068', 'WEAPON4': '0.100', 'AMMO3': '0.153', 'weapon5': '0.178', 'HITCOUNT': '0.200', 'WEAPON5': '0.250', 'WEAPON3': '0.500', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.624', 'weapon2': '1.252', 'weapon3': '1.874'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:11,204][63732] Updated weights for policy 0, policy_version 1980 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:11,545][63735] DAMAGECOUNT value on done: 9023.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:11,545][63735] Sum rewards: -4.348, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.358', 'weapon5': '0.014', 'AMMO2': '0.014', 'WEAPON1': '0.020', 'AMMO5': '0.023', 'ARMOR': '0.046', 'weapon4': '0.048', 'AMMO4': '0.070', 'WEAPON4': '0.100', 'AMMO3': '0.122', 'HITCOUNT': '0.160', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.616', 'weapon2': '1.702'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:12,458][109198] Fps is (10 sec: 11065.0, 60 sec: 11400.5, 300 sec: 11316.1). Total num frames: 15880192. Throughput: 0: 1168.5, 1: 1661.5. Samples: 3967189. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:12,461][109198] Avg episode reward: [(0, '-0.728'), (1, '-2.979')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:12,463][63454] Saving new best policy, reward=-0.728!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:12,649][63770] DAMAGECOUNT value on done: 13206.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:12,649][63770] Sum rewards: -0.320, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.507', 'AMMO4': '-0.015', 'AMMO2': '-0.003', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'ARMOR': '0.064', 'AMMO3': '0.093', 'HITCOUNT': '0.150', 'weapon5': '0.158', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.555', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.606', 'weapon3': '1.696'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:13,035][63770] DAMAGECOUNT value on done: 9389.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:13,036][63770] Sum rewards: 0.105, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.040', 'AMMO5': '0.013', 'ARMOR': '0.015', 'AMMO2': '0.016', 'WEAPON1': '0.030', 'weapon5': '0.036', 'AMMO4': '0.081', 'AMMO3': '0.085', 'WEAPON4': '0.100', 'weapon4': '0.180', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.675', 'weapon3': '0.986', 'FRAGCOUNT': '1.000', 'weapon2': '2.208'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:14,040][63733] Updated weights for policy 1, policy_version 1900 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:16,392][63767] DAMAGECOUNT value on done: 12952.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:16,704][63767] DAMAGECOUNT value on done: 12699.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:16,705][63767] Sum rewards: -1.932, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.330', 'AMMO2': '0.001', 'AMMO4': '0.005', 'AMMO5': '0.007', 'weapon5': '0.012', 'WEAPON1': '0.030', 'AMMO3': '0.128', 'WEAPON5': '0.150', 'HITCOUNT': '0.190', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.900', 'weapon2': '1.496', 'weapon3': '1.928', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:17,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11468.8, 300 sec: 11343.8). Total num frames: 15941632. Throughput: 0: 1137.0, 1: 1688.0. Samples: 3975682. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:17,460][109198] Avg episode reward: [(0, '-0.676'), (1, '-2.891')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:17,466][63454] Saving new best policy, reward=-0.676!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:19,365][63734] DAMAGECOUNT value on done: 11216.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:19,366][63734] Sum rewards: -0.874, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO5': '0.007', 'AMMO2': '0.026', 'WEAPON1': '0.030', 'HEALTH': '0.050', 'weapon5': '0.054', 'ARMOR': '0.080', 'HITCOUNT': '0.090', 'weapon4': '0.094', 'AMMO3': '0.098', 'AMMO4': '0.129', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.270', 'WEAPON3': '0.400', 'weapon3': '1.194', 'weapon2': '1.754', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:19,431][63805] DAMAGECOUNT value on done: 12405.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:19,431][63805] Sum rewards: -3.583, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.495', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'weapon5': '0.006', 'AMMO5': '0.015', 'ARMOR': '0.068', 'AMMO3': '0.161', 'HITCOUNT': '0.170', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.507', 'WEAPON3': '0.850', 'weapon2': '1.574', 'FRAGCOUNT': '2.000', 'weapon3': '2.016'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:19,657][63733] Updated weights for policy 1, policy_version 1910 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:19,758][63734] DAMAGECOUNT value on done: 11184.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:19,823][63805] DAMAGECOUNT value on done: 10312.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:19,823][63805] Sum rewards: -2.775, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.820', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'ARMOR': '0.036', 'AMMO3': '0.167', 'WEAPON5': '0.300', 'HITCOUNT': '0.450', 'WEAPON3': '0.950', 'weapon2': '1.454', 'DAMAGECOUNT': '1.683', 'weapon3': '1.740', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:20,261][63769] DAMAGECOUNT value on done: 11818.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:20,663][63769] DAMAGECOUNT value on done: 8461.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:20,663][63769] Sum rewards: -1.441, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.294', 'AMMO5': '0.010', 'AMMO2': '0.014', 'WEAPON1': '0.020', 'weapon5': '0.022', 'weapon4': '0.040', 'AMMO4': '0.071', 'ARMOR': '0.076', 'AMMO3': '0.100', 'WEAPON4': '0.100', 'HITCOUNT': '0.120', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.411', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.350', 'weapon3': '1.668'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:20,967][63734] DAMAGECOUNT value on done: 12324.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:20,968][63734] Sum rewards: -0.146, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.820', 'AMMO2': '0.008', 'AMMO5': '0.021', 'AMMO4': '0.037', 'WEAPON4': '0.050', 'AMMO3': '0.125', 'weapon5': '0.180', 'HITCOUNT': '0.310', 'WEAPON5': '0.450', 'WEAPON3': '0.700', 'weapon2': '1.230', 'DAMAGECOUNT': '1.623', 'FRAGCOUNT': '2.000', 'weapon3': '2.190'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:21,294][63734] DAMAGECOUNT value on done: 9935.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:21,295][63734] Sum rewards: -2.508, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.712', 'AMMO2': '0.002', 'AMMO4': '0.010', 'AMMO5': '0.010', 'WEAPON4': '0.100', 'weapon4': '0.100', 'ARMOR': '0.108', 'AMMO3': '0.133', 'HITCOUNT': '0.140', 'WEAPON5': '0.200', 'weapon5': '0.330', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.882', 'weapon2': '1.510', 'weapon3': '1.628'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:21,609][63732] Updated weights for policy 0, policy_version 1990 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:22,458][109198] Fps is (10 sec: 11469.0, 60 sec: 11400.5, 300 sec: 11316.1). Total num frames: 15994880. Throughput: 0: 1098.9, 1: 1723.5. Samples: 3992735. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:22,460][109198] Avg episode reward: [(0, '-0.718'), (1, '-2.726')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:22,462][63576] Saving new best policy, reward=-2.726!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:23,676][63769] DAMAGECOUNT value on done: 11696.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:23,676][63769] Sum rewards: -0.950, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.202', 'AMMO4': '-0.045', 'AMMO2': '-0.009', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'weapon5': '0.036', 'ARMOR': '0.044', 'WEAPON5': '0.100', 'AMMO3': '0.147', 'HITCOUNT': '0.220', 'DAMAGECOUNT': '0.600', 'WEAPON3': '0.900', 'weapon2': '1.398', 'weapon3': '1.836', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:24,008][63770] DAMAGECOUNT value on done: 9981.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:24,009][63770] Sum rewards: -4.953, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.305', 'AMMO4': '-0.013', 'AMMO2': '-0.003', 'weapon5': '0.002', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'ARMOR': '0.040', 'WEAPON5': '0.100', 'AMMO3': '0.153', 'HITCOUNT': '0.250', 'DAMAGECOUNT': '0.900', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.296', 'weapon3': '2.162'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:24,062][63769] DAMAGECOUNT value on done: 10995.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:24,063][63769] Sum rewards: -2.662, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.006', 'AMMO2': '0.004', 'AMMO5': '0.005', 'weapon5': '0.008', 'AMMO4': '0.022', 'WEAPON1': '0.030', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'weapon4': '0.114', 'HITCOUNT': '0.130', 'AMMO3': '0.147', 'DAMAGECOUNT': '0.630', 'WEAPON3': '0.850', 'weapon2': '0.974', 'FRAGCOUNT': '2.000', 'weapon3': '2.240'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:24,365][63770] DAMAGECOUNT value on done: 11844.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:24,365][63770] Sum rewards: 3.271, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.695', 'AMMO2': '0.004', 'AMMO5': '0.007', 'AMMO4': '0.019', 'ARMOR': '0.056', 'weapon5': '0.074', 'AMMO3': '0.112', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'weapon7': '0.308', 'HITCOUNT': '0.310', 'weapon4': '0.336', 'AMMO6': '0.400', 'WEAPON7': '0.400', 'AMMO7': '0.400', 'WEAPON3': '0.650', 'weapon2': '0.788', 'DAMAGECOUNT': '1.092', 'weapon3': '1.810', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:25,094][63733] Updated weights for policy 1, policy_version 1920 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:25,389][63767] DAMAGECOUNT value on done: 13586.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:25,670][63771] DAMAGECOUNT value on done: 10663.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:25,670][63771] Sum rewards: 1.448, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.384', 'AMMO5': '0.010', 'AMMO2': '0.015', 'WEAPON5': '0.050', 'AMMO4': '0.075', 'AMMO3': '0.104', 'weapon5': '0.114', 'WEAPON4': '0.150', 'weapon4': '0.176', 'HITCOUNT': '0.290', 'ARMOR': '0.468', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.996', 'weapon3': '1.178', 'weapon2': '1.606', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:25,796][63767] DAMAGECOUNT value on done: 15742.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:26,069][63805] Large shaping reward -2.549 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.3, -100.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:26,079][63771] DAMAGECOUNT value on done: 13680.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:26,079][63771] Sum rewards: 6.388, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO4': '-0.002', 'AMMO2': '-0.000', 'AMMO5': '0.007', 'ARMOR': '0.008', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'weapon7': '0.050', 'AMMO3': '0.070', 'weapon5': '0.078', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon4': '0.124', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'HEALTH': '0.307', 'WEAPON3': '0.350', 'HITCOUNT': '0.400', 'weapon2': '1.092', 'weapon3': '1.384', 'DAMAGECOUNT': '1.809', 'FRAGCOUNT': '6.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:27,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11400.5, 300 sec: 11329.9). Total num frames: 16052224. Throughput: 0: 1067.7, 1: 1751.2. Samples: 4009620. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:27,460][109198] Avg episode reward: [(0, '-0.596'), (1, '-2.750')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:27,467][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001924_7880704.pth...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:27,467][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001995_8171520.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:27,538][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001669_6836224.pth\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:27,539][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001586_6496256.pth\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:27,548][63454] Saving new best policy, reward=-0.596!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:30,306][63733] Updated weights for policy 1, policy_version 1930 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:31,394][63805] DAMAGECOUNT value on done: 13357.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:31,394][63805] Sum rewards: -3.185, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.542', 'AMMO5': '0.003', 'AMMO2': '0.013', 'ARMOR': '0.044', 'WEAPON5': '0.050', 'AMMO4': '0.067', 'WEAPON4': '0.100', 'AMMO3': '0.112', 'weapon4': '0.132', 'HITCOUNT': '0.230', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.738', 'FRAGCOUNT': '1.000', 'weapon3': '1.136', 'weapon2': '2.082'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:31,719][63805] DAMAGECOUNT value on done: 14294.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:31,719][63805] Sum rewards: -6.637, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.126', 'AMMO2': '0.002', 'AMMO5': '0.007', 'AMMO4': '0.011', 'weapon5': '0.026', 'WEAPON1': '0.060', 'AMMO3': '0.102', 'WEAPON5': '0.150', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.600', 'WEAPON3': '0.650', 'weapon2': '1.474', 'weapon3': '1.696'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:32,016][63806] DAMAGECOUNT value on done: 10941.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:32,016][63806] Sum rewards: -2.193, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.624', 'AMMO5': '0.003', 'AMMO2': '0.008', 'HITCOUNT': '0.010', 'WEAPON1': '0.010', 'weapon5': '0.012', 'AMMO4': '0.041', 'DAMAGECOUNT': '0.045', 'WEAPON4': '0.050', 'WEAPON5': '0.050', 'AMMO3': '0.084', 'weapon4': '0.130', 'ARMOR': '0.176', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.282', 'weapon2': '1.780'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:32,434][63806] DAMAGECOUNT value on done: 11122.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:32,435][63806] Sum rewards: -2.234, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.681', 'AMMO2': '0.006', 'AMMO5': '0.020', 'AMMO4': '0.032', 'ARMOR': '0.044', 'weapon4': '0.118', 'weapon5': '0.130', 'AMMO3': '0.135', 'WEAPON4': '0.150', 'HITCOUNT': '0.280', 'WEAPON5': '0.350', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.134', 'weapon2': '1.452', 'weapon3': '1.596'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:32,458][109198] Fps is (10 sec: 11468.6, 60 sec: 11332.2, 300 sec: 11316.1). Total num frames: 16109568. Throughput: 0: 1045.5, 1: 1774.9. Samples: 4018055. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:32,460][109198] Avg episode reward: [(0, '-0.613'), (1, '-2.823')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:33,581][63732] Updated weights for policy 0, policy_version 2000 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:33,785][63771] DAMAGECOUNT value on done: 11627.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:33,785][63771] Sum rewards: 0.978, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.040', 'weapon4': '0.010', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'AMMO2': '0.015', 'weapon5': '0.022', 'weapon7': '0.076', 'AMMO4': '0.076', 'HITCOUNT': '0.080', 'AMMO3': '0.087', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON7': '0.200', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.360', 'WEAPON3': '0.650', 'weapon2': '1.182', 'weapon3': '1.844', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:33,925][63735] DAMAGECOUNT value on done: 10503.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:34,161][63771] DAMAGECOUNT value on done: 9219.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:34,162][63771] Sum rewards: -5.378, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-0.644', 'AMMO5': '0.007', 'weapon5': '0.012', 'AMMO2': '0.015', 'weapon4': '0.018', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'AMMO4': '0.074', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'AMMO3': '0.225', 'DAMAGECOUNT': '0.675', 'weapon2': '0.720', 'WEAPON3': '1.200', 'FRAGCOUNT': '2.000', 'weapon3': '2.670'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:34,253][63735] DAMAGECOUNT value on done: 13593.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:34,253][63735] Sum rewards: 2.282, reward structure: {'DEATHCOUNT': '-3.750', 'HEALTH': '-0.238', 'AMMO4': '-0.016', 'AMMO2': '-0.003', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'AMMO3': '0.050', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon7': '0.154', 'HITCOUNT': '0.190', 'WEAPON7': '0.200', 'weapon5': '0.268', 'WEAPON5': '0.300', 'WEAPON3': '0.350', 'FRAGCOUNT': '0.500', 'ARMOR': '0.504', 'DAMAGECOUNT': '0.849', 'weapon3': '1.194', 'weapon2': '1.452'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:34,477][63806] DAMAGECOUNT value on done: 11090.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:34,477][63806] Sum rewards: -4.599, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.358', 'AMMO5': '0.016', 'AMMO2': '0.019', 'ARMOR': '0.072', 'AMMO4': '0.096', 'weapon5': '0.100', 'AMMO3': '0.188', 'HITCOUNT': '0.200', 'WEAPON4': '0.200', 'WEAPON5': '0.350', 'DAMAGECOUNT': '1.083', 'WEAPON3': '1.150', 'weapon2': '1.574', 'weapon3': '1.960', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:34,828][63806] DAMAGECOUNT value on done: 11338.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:34,829][63806] Sum rewards: -4.345, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.128', 'AMMO5': '0.003', 'AMMO2': '0.013', 'weapon4': '0.018', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.065', 'ARMOR': '0.076', 'AMMO3': '0.157', 'HITCOUNT': '0.160', 'DAMAGECOUNT': '0.459', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon3': '1.760', 'weapon2': '1.872'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:35,420][63735] DAMAGECOUNT value on done: 12302.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:35,420][63735] Sum rewards: 0.944, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.898', 'AMMO2': '0.006', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO4': '0.027', 'weapon5': '0.034', 'weapon7': '0.074', 'ARMOR': '0.104', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.121', 'WEAPON5': '0.150', 'WEAPON7': '0.200', 'WEAPON4': '0.250', 'HITCOUNT': '0.350', 'weapon4': '0.388', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.227', 'weapon3': '1.610', 'weapon2': '1.634', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:35,497][63733] Updated weights for policy 1, policy_version 1940 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:35,790][63735] DAMAGECOUNT value on done: 9217.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:35,791][63735] Sum rewards: -0.620, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.034', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'AMMO5': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.040', 'weapon5': '0.070', 'AMMO3': '0.117', 'HITCOUNT': '0.210', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.582', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.688', 'weapon2': '1.774'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:37,458][109198] Fps is (10 sec: 10649.6, 60 sec: 11195.7, 300 sec: 11288.3). Total num frames: 16158720. Throughput: 0: 998.5, 1: 1819.0. Samples: 4034668. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:37,460][109198] Avg episode reward: [(0, '-0.645'), (1, '-2.823')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:38,050][63770] DAMAGECOUNT value on done: 13646.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:38,051][63770] Sum rewards: 1.800, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.986', 'AMMO2': '0.002', 'AMMO4': '0.008', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'ARMOR': '0.062', 'AMMO3': '0.127', 'weapon5': '0.140', 'HITCOUNT': '0.190', 'AMMO6': '0.240', 'AMMO7': '0.240', 'weapon7': '0.292', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon4': '0.366', 'WEAPON7': '0.400', 'WEAPON3': '0.850', 'weapon2': '1.270', 'DAMAGECOUNT': '1.320', 'weapon3': '1.394', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:38,441][63770] DAMAGECOUNT value on done: 9455.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:39,882][63767] DAMAGECOUNT value on done: 13170.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:39,883][63767] Sum rewards: -3.295, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.420', 'AMMO2': '0.012', 'WEAPON1': '0.040', 'AMMO4': '0.060', 'ARMOR': '0.112', 'AMMO3': '0.115', 'WEAPON4': '0.150', 'HITCOUNT': '0.160', 'weapon4': '0.328', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.654', 'FRAGCOUNT': '1.000', 'weapon3': '1.414', 'weapon2': '1.680'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:40,272][63767] DAMAGECOUNT value on done: 12808.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:40,573][63733] Updated weights for policy 1, policy_version 1950 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:42,458][109198] Fps is (10 sec: 10649.8, 60 sec: 11195.7, 300 sec: 11302.2). Total num frames: 16216064. Throughput: 0: 949.6, 1: 1862.6. Samples: 4051438. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:42,460][109198] Avg episode reward: [(0, '-0.583'), (1, '-2.918')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:42,461][63454] Saving new best policy, reward=-0.583!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:42,892][63734] DAMAGECOUNT value on done: 12891.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:42,893][63734] Sum rewards: -0.610, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.267', 'AMMO5': '0.005', 'AMMO2': '0.014', 'weapon5': '0.052', 'AMMO4': '0.067', 'AMMO3': '0.125', 'WEAPON5': '0.150', 'weapon4': '0.308', 'WEAPON4': '0.350', 'HITCOUNT': '0.460', 'ARMOR': '0.571', 'WEAPON3': '0.850', 'weapon2': '1.518', 'DAMAGECOUNT': '1.701', 'weapon3': '1.736', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:43,030][63805] DAMAGECOUNT value on done: 12610.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:43,030][63805] Sum rewards: -1.170, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.730', 'weapon5': '0.002', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.010', 'ARMOR': '0.024', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.051', 'AMMO3': '0.121', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.615', 'WEAPON3': '0.750', 'weapon2': '1.090', 'FRAGCOUNT': '2.000', 'weapon3': '2.114'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:43,208][63734] DAMAGECOUNT value on done: 10616.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:43,208][63734] Sum rewards: 4.440, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.457', 'AMMO5': '0.005', 'AMMO2': '0.006', 'AMMO4': '0.030', 'WEAPON5': '0.100', 'weapon5': '0.106', 'AMMO3': '0.113', 'HITCOUNT': '0.460', 'ARMOR': '0.502', 'WEAPON3': '0.650', 'weapon3': '1.540', 'DAMAGECOUNT': '2.043', 'weapon2': '2.092', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:43,257][63734] DAMAGECOUNT value on done: 11316.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:43,386][63805] DAMAGECOUNT value on done: 10387.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:43,616][63734] DAMAGECOUNT value on done: 11561.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:43,616][63734] Sum rewards: 0.436, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.645', 'AMMO5': '0.005', 'AMMO2': '0.013', 'AMMO4': '0.065', 'weapon4': '0.088', 'WEAPON5': '0.100', 'ARMOR': '0.120', 'AMMO3': '0.134', 'WEAPON4': '0.200', 'HITCOUNT': '0.260', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.131', 'weapon3': '1.558', 'weapon2': '1.906', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:45,494][63769] DAMAGECOUNT value on done: 11943.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:45,672][63733] Updated weights for policy 1, policy_version 1960 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:45,893][63769] DAMAGECOUNT value on done: 8730.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:45,894][63769] Sum rewards: 1.501, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.747', 'AMMO5': '0.010', 'AMMO2': '0.018', 'WEAPON1': '0.030', 'ARMOR': '0.044', 'AMMO3': '0.084', 'AMMO4': '0.091', 'weapon6': '0.092', 'HITCOUNT': '0.160', 'AMMO6': '0.194', 'AMMO7': '0.194', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON6': '0.200', 'weapon4': '0.252', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.807', 'weapon3': '1.310', 'weapon2': '1.562', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:46,484][63732] Updated weights for policy 0, policy_version 2010 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:47,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11264.0, 300 sec: 11288.3). Total num frames: 16273408. Throughput: 0: 926.8, 1: 1883.6. Samples: 4059809. Policy #0 lag: (min: 0.0, avg: 0.1, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:47,460][109198] Avg episode reward: [(0, '-0.464'), (1, '-2.837')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:47,467][63454] Saving new best policy, reward=-0.464!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:47,894][63769] DAMAGECOUNT value on done: 11725.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:47,894][63769] Sum rewards: -5.506, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.023', 'AMMO2': '0.001', 'AMMO5': '0.003', 'AMMO4': '0.006', 'weapon5': '0.008', 'HITCOUNT': '0.050', 'WEAPON5': '0.050', 'DAMAGECOUNT': '0.087', 'ARMOR': '0.090', 'AMMO3': '0.094', 'WEAPON3': '0.600', 'weapon3': '1.094', 'weapon2': '2.434'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:48,235][63769] DAMAGECOUNT value on done: 11171.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:49,127][63767] DAMAGECOUNT value on done: 13741.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:49,402][63770] DAMAGECOUNT value on done: 10426.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:49,403][63770] Sum rewards: 5.023, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.410', 'AMMO5': '0.005', 'AMMO2': '0.013', 'weapon5': '0.056', 'AMMO4': '0.063', 'AMMO3': '0.099', 'WEAPON5': '0.100', 'ARMOR': '0.108', 'WEAPON4': '0.200', 'HITCOUNT': '0.340', 'weapon4': '0.394', 'WEAPON3': '0.700', 'weapon3': '1.250', 'DAMAGECOUNT': '1.335', 'weapon2': '1.770', 'FRAGCOUNT': '6.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:49,538][63771] DAMAGECOUNT value on done: 10808.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:49,539][63771] Sum rewards: -0.457, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.085', 'AMMO4': '-0.055', 'AMMO2': '-0.011', 'AMMO5': '0.005', 'weapon5': '0.046', 'AMMO3': '0.060', 'ARMOR': '0.088', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.480', 'weapon2': '2.120'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:49,539][63767] DAMAGECOUNT value on done: 16023.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:49,539][63767] Sum rewards: 0.239, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.196', 'AMMO2': '0.015', 'AMMO5': '0.020', 'WEAPON1': '0.020', 'weapon5': '0.038', 'ARMOR': '0.040', 'AMMO4': '0.076', 'AMMO3': '0.131', 'HITCOUNT': '0.250', 'WEAPON5': '0.300', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.843', 'weapon2': '1.466', 'weapon3': '1.936', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:49,810][63770] DAMAGECOUNT value on done: 12432.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:49,810][63770] Sum rewards: 8.596, reward structure: {'DEATHCOUNT': '-3.000', 'AMMO2': '0.007', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO4': '0.035', 'AMMO3': '0.060', 'WEAPON5': '0.100', 'HITCOUNT': '0.260', 'HEALTH': '0.282', 'weapon5': '0.320', 'WEAPON3': '0.350', 'ARMOR': '0.827', 'weapon2': '1.112', 'weapon3': '1.458', 'DAMAGECOUNT': '1.764', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:49,913][63771] DAMAGECOUNT value on done: 13850.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:51,029][63733] Updated weights for policy 1, policy_version 1970 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:52,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11264.0, 300 sec: 11288.3). Total num frames: 16330752. Throughput: 0: 888.5, 1: 1916.8. Samples: 4076474. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:52,460][109198] Avg episode reward: [(0, '-0.363'), (1, '-2.707')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:52,462][63576] Saving new best policy, reward=-2.707!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:52,462][63454] Saving new best policy, reward=-0.363!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:55,449][63805] DAMAGECOUNT value on done: 13607.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:55,811][63805] DAMAGECOUNT value on done: 14544.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:55,811][63805] Sum rewards: 0.105, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO5': '0.007', 'weapon5': '0.018', 'AMMO2': '0.021', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'AMMO3': '0.061', 'weapon4': '0.070', 'WEAPON5': '0.100', 'AMMO4': '0.104', 'HITCOUNT': '0.200', 'WEAPON3': '0.350', 'HEALTH': '0.728', 'DAMAGECOUNT': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.364', 'weapon2': '2.002'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:56,521][63733] Updated weights for policy 1, policy_version 1980 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:56,787][63806] DAMAGECOUNT value on done: 11298.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:56,788][63806] Sum rewards: -2.743, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.528', 'weapon5': '0.002', 'AMMO2': '0.005', 'AMMO5': '0.018', 'AMMO4': '0.025', 'ARMOR': '0.040', 'AMMO3': '0.156', 'WEAPON5': '0.250', 'HITCOUNT': '0.270', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.071', 'weapon3': '1.306', 'weapon2': '2.142', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:57,252][63806] DAMAGECOUNT value on done: 11393.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:57,252][63806] Sum rewards: -4.469, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.994', 'FRAGCOUNT': '-1.000', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.017', 'WEAPON4': '0.100', 'AMMO3': '0.158', 'weapon4': '0.168', 'weapon5': '0.188', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.230', 'WEAPON5': '0.250', 'ARMOR': '0.539', 'DAMAGECOUNT': '0.813', 'weapon2': '1.032', 'WEAPON3': '1.100', 'weapon3': '2.304'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:57,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11195.7, 300 sec: 11274.4). Total num frames: 16384000. Throughput: 0: 865.9, 1: 1925.0. Samples: 4092780. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:00:57,460][109198] Avg episode reward: [(0, '-0.408'), (1, '-2.684')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:57,468][63576] Saving new best policy, reward=-2.684!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:58,398][63732] Updated weights for policy 0, policy_version 2020 (0.0013)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:58,444][63806] DAMAGECOUNT value on done: 11231.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:58,445][63806] Sum rewards: -6.906, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.752', 'AMMO2': '0.007', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.032', 'weapon5': '0.036', 'WEAPON4': '0.050', 'weapon4': '0.056', 'ARMOR': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.155', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.423', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.364', 'weapon3': '2.178'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:58,703][63735] DAMAGECOUNT value on done: 10853.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:58,703][63735] Sum rewards: -2.617, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.813', 'AMMO2': '0.003', 'AMMO4': '0.016', 'ARMOR': '0.092', 'WEAPON4': '0.100', 'AMMO3': '0.115', 'weapon4': '0.136', 'HITCOUNT': '0.310', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.050', 'weapon2': '1.478', 'FRAGCOUNT': '2.000', 'weapon3': '2.046'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:58,840][63806] DAMAGECOUNT value on done: 11593.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:58,840][63806] Sum rewards: -2.235, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.172', 'AMMO2': '0.019', 'WEAPON1': '0.020', 'AMMO5': '0.023', 'weapon5': '0.048', 'AMMO4': '0.094', 'WEAPON4': '0.100', 'AMMO3': '0.145', 'HITCOUNT': '0.220', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.765', 'WEAPON3': '0.800', 'weapon2': '1.512', 'weapon3': '1.842', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:58,873][63771] DAMAGECOUNT value on done: 11802.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:58,874][63771] Sum rewards: -2.729, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.724', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO2': '0.020', 'weapon4': '0.046', 'weapon5': '0.052', 'ARMOR': '0.096', 'AMMO4': '0.101', 'AMMO3': '0.123', 'HITCOUNT': '0.180', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.525', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.554', 'weapon3': '1.720'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:59,117][63735] DAMAGECOUNT value on done: 13983.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:59,118][63735] Sum rewards: -0.375, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.814', 'AMMO5': '0.007', 'AMMO2': '0.009', 'WEAPON1': '0.020', 'weapon4': '0.026', 'ARMOR': '0.040', 'AMMO4': '0.047', 'weapon5': '0.084', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'AMMO3': '0.174', 'HITCOUNT': '0.300', 'WEAPON3': '0.850', 'weapon2': '1.160', 'DAMAGECOUNT': '1.170', 'weapon3': '2.302', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:59,257][63771] DAMAGECOUNT value on done: 9428.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:00:59,258][63771] Sum rewards: -1.382, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.452', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.012', 'weapon5': '0.038', 'weapon4': '0.044', 'WEAPON4': '0.050', 'ARMOR': '0.056', 'AMMO4': '0.061', 'AMMO3': '0.088', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.627', 'weapon3': '1.346', 'FRAGCOUNT': '2.000', 'weapon2': '2.118'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:00,246][63735] DAMAGECOUNT value on done: 12717.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:00,246][63735] Sum rewards: -1.082, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.780', 'AMMO4': '-0.014', 'AMMO2': '-0.003', 'ARMOR': '0.012', 'AMMO5': '0.015', 'weapon5': '0.064', 'weapon7': '0.082', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.128', 'WEAPON7': '0.200', 'HITCOUNT': '0.240', 'WEAPON5': '0.300', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.245', 'weapon2': '1.534', 'weapon3': '1.654', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:00,629][63735] DAMAGECOUNT value on done: 9297.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:00,629][63735] Sum rewards: -5.717, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.284', 'AMMO4': '-0.014', 'AMMO2': '-0.003', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'weapon5': '0.020', 'ARMOR': '0.032', 'HITCOUNT': '0.090', 'WEAPON5': '0.100', 'AMMO3': '0.165', 'DAMAGECOUNT': '0.240', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.334', 'weapon2': '2.278'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:02,001][63733] Updated weights for policy 1, policy_version 1990 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:02,458][109198] Fps is (10 sec: 11059.4, 60 sec: 11196.7, 300 sec: 11274.4). Total num frames: 16441344. Throughput: 0: 855.5, 1: 1925.9. Samples: 4100845. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:02,459][109198] Avg episode reward: [(0, '-0.438'), (1, '-2.683')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:03,610][63770] DAMAGECOUNT value on done: 13990.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:03,610][63770] Sum rewards: 0.658, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.760', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'ARMOR': '0.020', 'AMMO2': '0.024', 'weapon5': '0.048', 'AMMO3': '0.079', 'AMMO4': '0.122', 'WEAPON4': '0.150', 'WEAPON5': '0.250', 'HITCOUNT': '0.320', 'WEAPON3': '0.350', 'weapon4': '0.354', 'DAMAGECOUNT': '1.032', 'weapon2': '1.264', 'weapon3': '1.370', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:03,796][63767] DAMAGECOUNT value on done: 13305.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:03,797][63767] Sum rewards: -2.925, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.512', 'ARMOR': '0.008', 'weapon5': '0.010', 'AMMO5': '0.015', 'AMMO2': '0.024', 'WEAPON1': '0.050', 'AMMO3': '0.110', 'AMMO4': '0.120', 'HITCOUNT': '0.130', 'WEAPON4': '0.150', 'weapon4': '0.156', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.340', 'weapon3': '1.718'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:04,045][63770] DAMAGECOUNT value on done: 9810.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:04,046][63770] Sum rewards: -3.169, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.566', 'AMMO2': '0.015', 'WEAPON1': '0.020', 'weapon5': '0.024', 'AMMO5': '0.028', 'AMMO4': '0.076', 'AMMO3': '0.133', 'HITCOUNT': '0.330', 'WEAPON5': '0.500', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.065', 'weapon2': '1.216', 'FRAGCOUNT': '2.000', 'weapon3': '2.340'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:04,201][63767] DAMAGECOUNT value on done: 12938.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:04,203][63767] Sum rewards: -2.353, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.580', 'AMMO2': '0.002', 'weapon5': '0.006', 'AMMO5': '0.007', 'AMMO4': '0.008', 'WEAPON1': '0.020', 'HITCOUNT': '0.070', 'ARMOR': '0.080', 'WEAPON5': '0.150', 'AMMO3': '0.162', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.700', 'weapon2': '1.642', 'weapon3': '1.990', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:05,559][63734] DAMAGECOUNT value on done: 13146.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:05,559][63734] Sum rewards: -2.853, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.016', 'AMMO4': '-0.002', 'AMMO2': '-0.000', 'AMMO5': '0.005', 'WEAPON5': '0.100', 'ARMOR': '0.132', 'HITCOUNT': '0.190', 'AMMO3': '0.192', 'WEAPON4': '0.200', 'weapon4': '0.374', 'DAMAGECOUNT': '0.678', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.284', 'weapon3': '1.510'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:05,973][63734] DAMAGECOUNT value on done: 10983.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:05,974][63734] Sum rewards: -2.384, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.777', 'AMMO2': '0.005', 'AMMO5': '0.007', 'AMMO4': '0.024', 'weapon5': '0.034', 'weapon7': '0.048', 'ARMOR': '0.052', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.137', 'WEAPON5': '0.150', 'HITCOUNT': '0.320', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.101', 'weapon2': '1.282', 'weapon3': '2.132'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:07,182][63733] Updated weights for policy 1, policy_version 2000 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:07,345][63805] DAMAGECOUNT value on done: 12780.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:07,345][63805] Sum rewards: -2.050, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.226', 'AMMO4': '-0.017', 'AMMO2': '-0.003', 'AMMO5': '0.007', 'weapon5': '0.010', 'WEAPON1': '0.030', 'weapon7': '0.070', 'AMMO3': '0.101', 'HITCOUNT': '0.110', 'WEAPON5': '0.150', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON7': '0.200', 'ARMOR': '0.440', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.466', 'weapon2': '1.732'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:07,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11127.5, 300 sec: 11260.5). Total num frames: 16494592. Throughput: 0: 829.6, 1: 1940.2. Samples: 4117376. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:07,460][109198] Avg episode reward: [(0, '-0.467'), (1, '-2.616')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:07,467][63576] Saving new best policy, reward=-2.616!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:07,646][63734] DAMAGECOUNT value on done: 11501.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:07,647][63734] Sum rewards: 1.367, reward structure: {'DEATHCOUNT': '-5.250', 'weapon5': '0.002', 'AMMO5': '0.003', 'AMMO2': '0.006', 'AMMO4': '0.032', 'WEAPON5': '0.050', 'HEALTH': '0.078', 'AMMO3': '0.109', 'HITCOUNT': '0.140', 'ARMOR': '0.440', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.555', 'FRAGCOUNT': '1.000', 'weapon3': '1.524', 'weapon2': '2.228'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:07,771][63805] DAMAGECOUNT value on done: 10531.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:07,771][63805] Sum rewards: -3.020, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.656', 'AMMO5': '0.009', 'AMMO2': '0.010', 'WEAPON1': '0.030', 'ARMOR': '0.032', 'AMMO4': '0.051', 'weapon5': '0.052', 'weapon4': '0.066', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'AMMO3': '0.124', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.432', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.654', 'weapon2': '1.686'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:08,033][63734] DAMAGECOUNT value on done: 11872.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:08,034][63734] Sum rewards: -1.417, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.830', 'AMMO2': '0.006', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'weapon5': '0.028', 'AMMO4': '0.028', 'AMMO3': '0.153', 'WEAPON5': '0.250', 'HITCOUNT': '0.300', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.933', 'weapon3': '1.810', 'weapon2': '1.822', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:08,174][63769] DAMAGECOUNT value on done: 12611.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:08,175][63769] Sum rewards: 2.441, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.444', 'AMMO4': '-0.030', 'AMMO2': '-0.006', 'ARMOR': '0.008', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'weapon7': '0.050', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.153', 'weapon5': '0.190', 'WEAPON7': '0.200', 'WEAPON5': '0.300', 'HITCOUNT': '0.340', 'WEAPON3': '0.650', 'weapon2': '1.130', 'DAMAGECOUNT': '2.004', 'weapon3': '2.134', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:08,588][63769] DAMAGECOUNT value on done: 8856.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:08,588][63769] Sum rewards: -2.510, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.648', 'AMMO2': '0.003', 'AMMO5': '0.012', 'AMMO4': '0.017', 'WEAPON1': '0.040', 'HITCOUNT': '0.050', 'AMMO3': '0.135', 'weapon5': '0.228', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.378', 'ARMOR': '0.440', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.022', 'weapon3': '1.362'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:11,152][63732] Updated weights for policy 0, policy_version 2030 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:12,355][63733] Updated weights for policy 1, policy_version 2010 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:12,452][63769] DAMAGECOUNT value on done: 12030.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:12,452][63769] Sum rewards: -3.545, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.082', 'AMMO4': '-0.017', 'AMMO2': '-0.003', 'weapon5': '0.006', 'AMMO5': '0.018', 'WEAPON1': '0.030', 'ARMOR': '0.084', 'AMMO3': '0.155', 'HITCOUNT': '0.190', 'WEAPON5': '0.350', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.915', 'weapon2': '1.468', 'weapon3': '1.942', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:12,459][109198] Fps is (10 sec: 11057.9, 60 sec: 11195.5, 300 sec: 11260.5). Total num frames: 16551936. Throughput: 0: 810.6, 1: 1951.1. Samples: 4133899. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:12,461][109198] Avg episode reward: [(0, '-0.462'), (1, '-2.529')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:12,462][63576] Saving new best policy, reward=-2.529!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:12,839][63769] DAMAGECOUNT value on done: 11356.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:12,840][63769] Sum rewards: -2.750, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.375', 'weapon5': '0.002', 'AMMO2': '0.014', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'AMMO4': '0.069', 'AMMO3': '0.161', 'HITCOUNT': '0.170', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.555', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.412', 'weapon3': '2.254'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:13,283][63767] DAMAGECOUNT value on done: 13957.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:13,284][63767] Sum rewards: -5.421, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.334', 'AMMO2': '0.003', 'AMMO4': '0.014', 'AMMO5': '0.017', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'weapon5': '0.050', 'AMMO3': '0.110', 'HITCOUNT': '0.180', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.648', 'WEAPON3': '0.700', 'weapon3': '1.512', 'weapon2': '1.898', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:13,655][63767] DAMAGECOUNT value on done: 16302.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:13,656][63767] Sum rewards: -1.413, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.442', 'AMMO2': '0.011', 'AMMO5': '0.012', 'weapon5': '0.042', 'WEAPON1': '0.050', 'AMMO4': '0.057', 'ARMOR': '0.072', 'AMMO3': '0.088', 'WEAPON4': '0.100', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.837', 'FRAGCOUNT': '1.000', 'weapon2': '1.586', 'weapon3': '1.754'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:14,289][63771] DAMAGECOUNT value on done: 11149.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:14,290][63771] Sum rewards: -5.854, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-3.044', 'AMMO4': '-0.022', 'AMMO2': '-0.004', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'weapon5': '0.074', 'ARMOR': '0.076', 'WEAPON5': '0.100', 'AMMO3': '0.172', 'HITCOUNT': '0.280', 'DAMAGECOUNT': '1.023', 'WEAPON3': '1.150', 'weapon2': '1.598', 'weapon3': '1.968', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:14,692][63771] DAMAGECOUNT value on done: 13951.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:14,692][63771] Sum rewards: -2.149, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.260', 'ARMOR': '0.008', 'WEAPON1': '0.010', 'AMMO2': '0.022', 'HITCOUNT': '0.090', 'AMMO3': '0.105', 'AMMO4': '0.111', 'weapon4': '0.178', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.288', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.596', 'weapon2': '1.752'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:15,346][63770] DAMAGECOUNT value on done: 10556.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:15,347][63770] Sum rewards: 0.413, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.764', 'AMMO2': '0.010', 'weapon5': '0.016', 'AMMO5': '0.020', 'WEAPON1': '0.030', 'AMMO4': '0.049', 'ARMOR': '0.080', 'HITCOUNT': '0.080', 'WEAPON4': '0.100', 'AMMO3': '0.102', 'weapon4': '0.192', 'DAMAGECOUNT': '0.390', 'WEAPON5': '0.400', 'WEAPON3': '0.600', 'weapon3': '1.282', 'weapon2': '1.826', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:15,754][63770] DAMAGECOUNT value on done: 12782.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:15,755][63770] Sum rewards: -5.528, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.600', 'AMMO5': '0.010', 'AMMO2': '0.013', 'ARMOR': '0.045', 'AMMO4': '0.065', 'weapon5': '0.068', 'WEAPON1': '0.070', 'AMMO3': '0.151', 'WEAPON5': '0.250', 'HITCOUNT': '0.370', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050', 'DAMAGECOUNT': '1.050', 'weapon2': '1.254', 'weapon3': '2.176'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:17,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11059.2, 300 sec: 11274.4). Total num frames: 16605184. Throughput: 0: 815.6, 1: 1944.3. Samples: 4142249. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:17,460][109198] Avg episode reward: [(0, '-0.525'), (1, '-2.548')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:17,688][63733] Updated weights for policy 1, policy_version 2020 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:19,599][63805] DAMAGECOUNT value on done: 13887.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:19,599][63805] Sum rewards: -2.039, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.312', 'AMMO2': '0.008', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'AMMO4': '0.042', 'WEAPON4': '0.050', 'AMMO3': '0.110', 'weapon4': '0.148', 'WEAPON5': '0.150', 'HITCOUNT': '0.270', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.840', 'FRAGCOUNT': '1.000', 'weapon3': '1.502', 'weapon2': '1.788'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:20,007][63805] DAMAGECOUNT value on done: 14683.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:21,325][63806] DAMAGECOUNT value on done: 11639.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:21,326][63806] Sum rewards: -2.268, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.994', 'AMMO2': '0.000', 'AMMO4': '0.002', 'AMMO5': '0.010', 'ARMOR': '0.028', 'WEAPON1': '0.040', 'weapon5': '0.056', 'AMMO3': '0.093', 'WEAPON5': '0.200', 'HITCOUNT': '0.290', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.023', 'weapon3': '1.520', 'FRAGCOUNT': '2.000', 'weapon2': '2.014'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:21,724][63806] DAMAGECOUNT value on done: 11314.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:21,786][63806] DAMAGECOUNT value on done: 11767.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:21,786][63806] Sum rewards: -6.161, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.770', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.031', 'AMMO2': '-0.006', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'ARMOR': '0.080', 'weapon5': '0.130', 'AMMO3': '0.178', 'WEAPON5': '0.300', 'HITCOUNT': '0.310', 'WEAPON3': '1.100', 'DAMAGECOUNT': '1.122', 'weapon2': '1.360', 'weapon3': '2.040'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:22,138][63806] DAMAGECOUNT value on done: 11732.0\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:22,458][109198] Fps is (10 sec: 11060.5, 60 sec: 11127.5, 300 sec: 11288.3). Total num frames: 16662528. Throughput: 0: 830.5, 1: 1936.9. Samples: 4159200. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:22,460][109198] Avg episode reward: [(0, '-0.515'), (1, '-2.563')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:22,865][63732] Updated weights for policy 0, policy_version 2040 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:22,998][63733] Updated weights for policy 1, policy_version 2030 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:23,823][63735] DAMAGECOUNT value on done: 10868.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:24,236][63735] DAMAGECOUNT value on done: 13077.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:24,236][63735] Sum rewards: -8.533, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-3.120', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'AMMO5': '0.007', 'WEAPON5': '0.150', 'AMMO3': '0.234', 'HITCOUNT': '0.310', 'DAMAGECOUNT': '1.080', 'WEAPON3': '1.400', 'weapon2': '1.614', 'FRAGCOUNT': '2.000', 'weapon3': '2.054'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:24,252][63735] DAMAGECOUNT value on done: 14343.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:24,253][63735] Sum rewards: -0.662, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.610', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'weapon5': '0.028', 'AMMO3': '0.139', 'WEAPON5': '0.150', 'HITCOUNT': '0.200', 'ARMOR': '0.489', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.080', 'weapon2': '1.252', 'weapon3': '1.950', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:24,311][63771] DAMAGECOUNT value on done: 12011.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:24,312][63771] Sum rewards: -2.216, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.934', 'AMMO5': '0.005', 'AMMO2': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.059', 'WEAPON5': '0.100', 'weapon4': '0.130', 'WEAPON4': '0.150', 'AMMO3': '0.153', 'HITCOUNT': '0.170', 'ARMOR': '0.574', 'DAMAGECOUNT': '0.627', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.332', 'weapon3': '1.686'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:24,665][63735] DAMAGECOUNT value on done: 9487.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:24,666][63735] Sum rewards: -5.564, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.910', 'AMMO2': '0.014', 'WEAPON1': '0.040', 'AMMO4': '0.071', 'HITCOUNT': '0.130', 'AMMO3': '0.191', 'DAMAGECOUNT': '0.570', 'WEAPON3': '1.000', 'weapon2': '1.510', 'weapon3': '2.070', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:24,724][63771] DAMAGECOUNT value on done: 9778.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:24,724][63771] Sum rewards: 2.295, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO5': '0.003', 'weapon5': '0.016', 'WEAPON1': '0.020', 'AMMO2': '0.025', 'WEAPON5': '0.050', 'ARMOR': '0.076', 'HEALTH': '0.088', 'AMMO3': '0.098', 'AMMO4': '0.125', 'weapon4': '0.144', 'WEAPON4': '0.150', 'HITCOUNT': '0.310', 'WEAPON3': '0.550', 'DAMAGECOUNT': '1.050', 'weapon3': '1.558', 'weapon2': '1.782', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:27,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11059.2, 300 sec: 11288.3). Total num frames: 16715776. Throughput: 0: 842.5, 1: 1925.0. Samples: 4175975. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:27,460][109198] Avg episode reward: [(0, '-0.572'), (1, '-2.578')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:27,881][63767] DAMAGECOUNT value on done: 13698.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:27,881][63767] Sum rewards: 0.510, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.060', 'weapon4': '0.002', 'AMMO5': '0.007', 'AMMO2': '0.012', 'weapon5': '0.026', 'WEAPON1': '0.030', 'AMMO4': '0.062', 'ARMOR': '0.068', 'WEAPON4': '0.100', 'AMMO3': '0.111', 'WEAPON5': '0.150', 'HITCOUNT': '0.250', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.179', 'weapon2': '1.598', 'weapon3': '1.824', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:27,886][63734] DAMAGECOUNT value on done: 13455.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:27,886][63734] Sum rewards: -2.012, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.116', 'AMMO5': '0.003', 'AMMO2': '0.007', 'WEAPON1': '0.010', 'weapon5': '0.034', 'AMMO4': '0.035', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO3': '0.126', 'ARMOR': '0.128', 'weapon4': '0.212', 'HITCOUNT': '0.260', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.927', 'FRAGCOUNT': '1.000', 'weapon2': '1.220', 'weapon3': '1.692'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:28,206][63767] DAMAGECOUNT value on done: 13088.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:28,241][63734] DAMAGECOUNT value on done: 11358.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:28,242][63734] Sum rewards: -5.473, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.965', 'FRAGCOUNT': '-0.500', 'ARMOR': '0.008', 'WEAPON1': '0.010', 'AMMO2': '0.014', 'AMMO5': '0.020', 'weapon5': '0.026', 'AMMO4': '0.071', 'WEAPON4': '0.150', 'AMMO3': '0.156', 'weapon4': '0.252', 'HITCOUNT': '0.280', 'WEAPON5': '0.400', 'WEAPON3': '0.900', 'weapon2': '0.986', 'DAMAGECOUNT': '1.125', 'weapon3': '2.094'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:28,337][63733] Updated weights for policy 1, policy_version 2040 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:29,164][63770] DAMAGECOUNT value on done: 14253.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:29,164][63770] Sum rewards: -2.478, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.750', 'AMMO2': '0.004', 'AMMO5': '0.017', 'AMMO4': '0.019', 'weapon5': '0.030', 'weapon7': '0.096', 'AMMO3': '0.124', 'HITCOUNT': '0.210', 'AMMO6': '0.220', 'AMMO7': '0.220', 'WEAPON5': '0.250', 'WEAPON7': '0.300', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.789', 'WEAPON3': '0.850', 'weapon2': '1.160', 'weapon3': '1.984'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:29,537][63770] DAMAGECOUNT value on done: 10073.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:29,537][63770] Sum rewards: 1.190, reward structure: {'DEATHCOUNT': '-5.250', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.010', 'weapon4': '0.012', 'weapon5': '0.024', 'ARMOR': '0.039', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.050', 'AMMO3': '0.070', 'HITCOUNT': '0.180', 'WEAPON3': '0.350', 'HEALTH': '0.432', 'DAMAGECOUNT': '0.789', 'FRAGCOUNT': '1.000', 'weapon3': '1.456', 'weapon2': '1.912'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:30,066][63805] Large shaping reward 2.640 for [('FRAGCOUNT', 2.0, 2.0), ('HITCOUNT', 0.04, 4.0), ('DAMAGECOUNT', 0.6, 200)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:30,380][63769] DAMAGECOUNT value on done: 13153.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:30,381][63769] Sum rewards: 2.567, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO5': '0.005', 'AMMO2': '0.007', 'WEAPON1': '0.010', 'ARMOR': '0.024', 'AMMO4': '0.036', 'weapon5': '0.036', 'HEALTH': '0.037', 'WEAPON5': '0.050', 'AMMO3': '0.106', 'HITCOUNT': '0.370', 'WEAPON3': '0.650', 'weapon2': '1.156', 'DAMAGECOUNT': '1.626', 'weapon3': '1.954', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:30,735][63769] DAMAGECOUNT value on done: 9251.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:30,736][63769] Sum rewards: 2.460, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.356', 'AMMO5': '0.017', 'AMMO2': '0.018', 'WEAPON1': '0.070', 'ARMOR': '0.076', 'AMMO4': '0.090', 'WEAPON4': '0.100', 'weapon4': '0.136', 'AMMO3': '0.150', 'weapon5': '0.204', 'HITCOUNT': '0.280', 'WEAPON5': '0.350', 'weapon2': '0.732', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.185', 'weapon3': '2.158', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:31,160][63805] DAMAGECOUNT value on done: 13025.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:31,161][63805] Sum rewards: 1.400, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.766', 'WEAPON1': '0.010', 'AMMO2': '0.010', 'AMMO5': '0.013', 'weapon4': '0.022', 'WEAPON4': '0.050', 'AMMO4': '0.051', 'weapon5': '0.062', 'AMMO3': '0.085', 'WEAPON5': '0.150', 'HITCOUNT': '0.180', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.735', 'weapon2': '1.608', 'weapon3': '1.890', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:31,553][63805] DAMAGECOUNT value on done: 10671.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:31,553][63805] Sum rewards: -3.491, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.960', 'AMMO5': '0.009', 'weapon4': '0.012', 'WEAPON1': '0.020', 'AMMO2': '0.025', 'ARMOR': '0.040', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO4': '0.125', 'weapon5': '0.126', 'AMMO3': '0.127', 'DAMAGECOUNT': '0.420', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.800', 'weapon3': '1.582', 'weapon2': '1.632'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:31,797][63734] DAMAGECOUNT value on done: 11867.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:31,797][63734] Sum rewards: -0.730, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.075', 'AMMO2': '0.009', 'AMMO4': '0.042', 'WEAPON4': '0.050', 'ARMOR': '0.064', 'AMMO3': '0.088', 'weapon4': '0.248', 'HITCOUNT': '0.260', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.098', 'weapon3': '1.586', 'FRAGCOUNT': '2.000', 'weapon2': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:32,198][63734] DAMAGECOUNT value on done: 11947.0\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:32,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11059.2, 300 sec: 11274.4). Total num frames: 16773120. Throughput: 0: 846.5, 1: 1921.8. Samples: 4184382. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:32,459][109198] Avg episode reward: [(0, '-0.599'), (1, '-2.526')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:32,461][63576] Saving new best policy, reward=-2.526!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:33,671][63733] Updated weights for policy 1, policy_version 2050 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:34,600][63732] Updated weights for policy 0, policy_version 2050 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:37,091][63767] DAMAGECOUNT value on done: 14112.0\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:37,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11195.7, 300 sec: 11274.4). Total num frames: 16830464. Throughput: 0: 847.6, 1: 1920.5. Samples: 4201036. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:37,460][109198] Avg episode reward: [(0, '-0.599'), (1, '-2.489')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:37,467][63576] Saving new best policy, reward=-2.489!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:37,475][63767] DAMAGECOUNT value on done: 16482.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:37,475][63767] Sum rewards: -7.726, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.978', 'AMMO2': '0.008', 'WEAPON1': '0.040', 'AMMO4': '0.040', 'AMMO3': '0.143', 'HITCOUNT': '0.180', 'ARMOR': '0.484', 'DAMAGECOUNT': '0.540', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon3': '1.674', 'weapon2': '1.942'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:37,571][63769] DAMAGECOUNT value on done: 12388.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:37,571][63769] Sum rewards: -1.564, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.434', 'AMMO2': '0.004', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.021', 'weapon5': '0.088', 'AMMO3': '0.138', 'HITCOUNT': '0.200', 'WEAPON5': '0.300', 'ARMOR': '0.420', 'WEAPON3': '0.850', 'weapon2': '1.004', 'DAMAGECOUNT': '1.074', 'weapon3': '1.986', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:37,959][63769] DAMAGECOUNT value on done: 11396.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:37,959][63769] Sum rewards: -0.305, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.222', 'weapon5': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.011', 'WEAPON1': '0.040', 'HITCOUNT': '0.050', 'AMMO4': '0.056', 'ARMOR': '0.080', 'AMMO3': '0.097', 'DAMAGECOUNT': '0.120', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'weapon4': '0.400', 'WEAPON3': '0.650', 'weapon3': '1.328', 'weapon2': '1.716', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:38,144][63771] DAMAGECOUNT value on done: 11184.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:38,522][63771] DAMAGECOUNT value on done: 14066.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:39,000][63733] Updated weights for policy 1, policy_version 2060 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:40,722][63770] DAMAGECOUNT value on done: 10659.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:41,131][63770] DAMAGECOUNT value on done: 12964.0\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:42,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11127.5, 300 sec: 11274.4). Total num frames: 16883712. Throughput: 0: 849.1, 1: 1932.4. Samples: 4217944. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:42,460][109198] Avg episode reward: [(0, '-0.691'), (1, '-2.536')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:43,381][63805] DAMAGECOUNT value on done: 14167.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:43,382][63805] Sum rewards: -0.393, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.843', 'AMMO5': '0.010', 'AMMO2': '0.011', 'WEAPON1': '0.050', 'AMMO4': '0.054', 'weapon5': '0.078', 'ARMOR': '0.080', 'AMMO3': '0.087', 'WEAPON4': '0.150', 'HITCOUNT': '0.160', 'weapon4': '0.168', 'WEAPON5': '0.200', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.840', 'weapon2': '1.266', 'weapon3': '1.946', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:43,760][63805] DAMAGECOUNT value on done: 15173.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:43,761][63805] Sum rewards: 2.963, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.270', 'AMMO4': '-0.041', 'AMMO2': '-0.008', 'weapon5': '0.004', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'AMMO3': '0.061', 'ARMOR': '0.073', 'weapon7': '0.080', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.210', 'WEAPON3': '0.450', 'DAMAGECOUNT': '1.302', 'weapon3': '1.456', 'weapon2': '1.976', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:44,164][63733] Updated weights for policy 1, policy_version 2070 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:45,294][63806] DAMAGECOUNT value on done: 11694.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:45,295][63806] Sum rewards: 2.125, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.560', 'weapon5': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.024', 'WEAPON1': '0.030', 'ARMOR': '0.040', 'AMMO3': '0.098', 'weapon4': '0.100', 'AMMO4': '0.119', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'HITCOUNT': '0.360', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.140', 'weapon3': '1.648', 'weapon2': '1.658', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:45,681][63806] DAMAGECOUNT value on done: 11992.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:45,681][63806] Sum rewards: 1.262, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.005', 'AMMO2': '0.012', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'AMMO4': '0.059', 'AMMO3': '0.060', 'weapon4': '0.062', 'WEAPON5': '0.100', 'weapon5': '0.136', 'HEALTH': '0.178', 'HITCOUNT': '0.180', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.780', 'weapon3': '1.416', 'weapon2': '1.794', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:46,062][63806] DAMAGECOUNT value on done: 11819.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:46,062][63806] Sum rewards: -0.717, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.480', 'AMMO4': '-0.008', 'AMMO2': '-0.002', 'AMMO5': '0.009', 'weapon5': '0.030', 'WEAPON1': '0.040', 'ARMOR': '0.045', 'AMMO3': '0.093', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.540', 'FRAGCOUNT': '1.000', 'weapon3': '1.274', 'weapon2': '1.940'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:46,420][63806] DAMAGECOUNT value on done: 12025.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:46,421][63806] Sum rewards: -5.894, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.972', 'AMMO2': '0.002', 'AMMO4': '0.009', 'AMMO5': '0.015', 'weapon5': '0.034', 'ARMOR': '0.052', 'AMMO3': '0.187', 'HITCOUNT': '0.200', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.729', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.306', 'weapon3': '2.244'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:46,572][63732] Updated weights for policy 0, policy_version 2060 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:47,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11127.5, 300 sec: 11274.4). Total num frames: 16941056. Throughput: 0: 848.2, 1: 1941.8. Samples: 4226396. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:47,460][109198] Avg episode reward: [(0, '-0.755'), (1, '-2.279')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:47,467][63576] Saving new best policy, reward=-2.279!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:47,564][63735] DAMAGECOUNT value on done: 13283.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:47,565][63735] Sum rewards: 0.871, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.187', 'WEAPON1': '0.010', 'AMMO2': '0.036', 'AMMO3': '0.097', 'ARMOR': '0.108', 'HITCOUNT': '0.180', 'AMMO4': '0.181', 'WEAPON4': '0.300', 'WEAPON3': '0.300', 'weapon4': '0.318', 'DAMAGECOUNT': '0.618', 'weapon3': '1.004', 'weapon2': '1.906', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:47,952][63735] DAMAGECOUNT value on done: 9542.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:47,952][63735] Sum rewards: -2.648, reward structure: {'DEATHCOUNT': '-5.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.430', 'AMMO5': '0.010', 'AMMO2': '0.017', 'WEAPON1': '0.040', 'HITCOUNT': '0.050', 'AMMO3': '0.060', 'ARMOR': '0.066', 'AMMO4': '0.082', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.165', 'weapon5': '0.190', 'WEAPON5': '0.200', 'weapon4': '0.362', 'WEAPON3': '0.450', 'weapon2': '1.320', 'weapon3': '1.370'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:48,551][63735] DAMAGECOUNT value on done: 10928.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:48,927][63735] DAMAGECOUNT value on done: 14881.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:48,927][63735] Sum rewards: -0.944, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.074', 'AMMO4': '-0.017', 'AMMO2': '-0.003', 'WEAPON1': '0.010', 'AMMO5': '0.010', 'ARMOR': '0.036', 'weapon7': '0.080', 'weapon5': '0.096', 'WEAPON4': '0.100', 'weapon4': '0.104', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.144', 'WEAPON7': '0.200', 'WEAPON5': '0.250', 'HITCOUNT': '0.400', 'WEAPON3': '0.900', 'weapon2': '0.928', 'DAMAGECOUNT': '1.614', 'FRAGCOUNT': '2.000', 'weapon3': '2.038'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:49,271][63733] Updated weights for policy 1, policy_version 2080 (0.0013)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:49,399][63771] DAMAGECOUNT value on done: 12246.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:49,399][63771] Sum rewards: -6.233, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.282', 'AMMO4': '-0.021', 'AMMO2': '-0.004', 'AMMO5': '0.010', 'ARMOR': '0.068', 'weapon5': '0.114', 'WEAPON5': '0.200', 'HITCOUNT': '0.210', 'AMMO3': '0.214', 'DAMAGECOUNT': '0.705', 'WEAPON3': '1.000', 'weapon2': '1.754', 'weapon3': '1.798', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:49,789][63771] DAMAGECOUNT value on done: 9882.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:49,790][63771] Sum rewards: -7.464, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.582', 'AMMO4': '-0.016', 'AMMO2': '-0.003', 'weapon5': '0.004', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'ARMOR': '0.064', 'HITCOUNT': '0.100', 'AMMO3': '0.111', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.312', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.670', 'weapon2': '1.996'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:49,863][63734] DAMAGECOUNT value on done: 13828.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:49,863][63734] Sum rewards: -1.524, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.098', 'AMMO2': '0.003', 'AMMO5': '0.014', 'AMMO4': '0.015', 'WEAPON1': '0.040', 'WEAPON4': '0.100', 'AMMO3': '0.110', 'HITCOUNT': '0.160', 'weapon5': '0.168', 'weapon4': '0.240', 'WEAPON5': '0.300', 'ARMOR': '0.468', 'WEAPON3': '0.700', 'weapon2': '1.094', 'DAMAGECOUNT': '1.119', 'weapon3': '1.542', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:50,195][63734] DAMAGECOUNT value on done: 11563.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:50,196][63734] Sum rewards: -0.892, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.432', 'AMMO5': '0.003', 'weapon5': '0.006', 'ARMOR': '0.012', 'AMMO2': '0.013', 'WEAPON1': '0.040', 'weapon4': '0.044', 'WEAPON5': '0.050', 'AMMO4': '0.065', 'WEAPON4': '0.100', 'AMMO3': '0.156', 'HITCOUNT': '0.200', 'DAMAGECOUNT': '0.615', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.340', 'weapon3': '1.896'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:51,538][63767] DAMAGECOUNT value on done: 13883.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:51,539][63767] Sum rewards: -0.890, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.528', 'AMMO2': '0.007', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO4': '0.034', 'WEAPON4': '0.050', 'ARMOR': '0.084', 'weapon5': '0.102', 'weapon4': '0.120', 'AMMO3': '0.122', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.555', 'WEAPON3': '0.850', 'weapon2': '1.380', 'weapon3': '1.996', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:51,928][63767] DAMAGECOUNT value on done: 13450.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:51,928][63767] Sum rewards: -4.531, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-0.500', 'HEALTH': '-0.212', 'AMMO2': '0.011', 'WEAPON1': '0.020', 'AMMO5': '0.020', 'AMMO4': '0.054', 'ARMOR': '0.057', 'weapon5': '0.086', 'weapon4': '0.094', 'WEAPON4': '0.100', 'AMMO3': '0.125', 'HITCOUNT': '0.200', 'WEAPON5': '0.350', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.086', 'weapon2': '1.426', 'weapon3': '1.652'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:52,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11127.5, 300 sec: 11274.4). Total num frames: 16998400. Throughput: 0: 851.3, 1: 1948.4. Samples: 4243363. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:52,460][109198] Avg episode reward: [(0, '-0.868'), (1, '-2.420')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:52,569][63769] DAMAGECOUNT value on done: 13543.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:52,569][63769] Sum rewards: 2.584, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.990', 'ARMOR': '0.016', 'AMMO2': '0.023', 'AMMO5': '0.024', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'AMMO4': '0.115', 'AMMO3': '0.130', 'weapon4': '0.212', 'weapon5': '0.218', 'HITCOUNT': '0.290', 'WEAPON5': '0.350', 'WEAPON3': '0.750', 'weapon2': '0.794', 'DAMAGECOUNT': '1.170', 'weapon3': '1.902', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:52,923][63769] DAMAGECOUNT value on done: 9561.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:52,924][63769] Sum rewards: -1.077, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.500', 'AMMO5': '0.007', 'AMMO2': '0.015', 'ARMOR': '0.020', 'weapon5': '0.034', 'WEAPON5': '0.050', 'AMMO4': '0.073', 'weapon7': '0.082', 'AMMO3': '0.120', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.250', 'weapon4': '0.368', 'weapon2': '0.726', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.930', 'FRAGCOUNT': '1.000', 'weapon3': '2.058'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:54,239][63733] Updated weights for policy 1, policy_version 2090 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:54,473][63770] DAMAGECOUNT value on done: 14423.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:54,881][63770] DAMAGECOUNT value on done: 10448.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:54,881][63770] Sum rewards: -3.901, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.568', 'AMMO4': '-0.047', 'AMMO2': '-0.009', 'AMMO5': '0.008', 'ARMOR': '0.064', 'weapon5': '0.100', 'AMMO3': '0.172', 'WEAPON5': '0.200', 'HITCOUNT': '0.310', 'WEAPON3': '1.050', 'DAMAGECOUNT': '1.125', 'weapon2': '1.458', 'weapon3': '1.986', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:54,959][63805] DAMAGECOUNT value on done: 13349.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:54,959][63805] Sum rewards: -2.177, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.460', 'AMMO2': '0.010', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'weapon5': '0.022', 'AMMO4': '0.047', 'weapon4': '0.074', 'ARMOR': '0.094', 'AMMO3': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'HITCOUNT': '0.240', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.972', 'weapon2': '1.568', 'weapon3': '1.924', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:55,338][63805] DAMAGECOUNT value on done: 10821.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:55,339][63805] Sum rewards: -6.591, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-3.008', 'weapon5': '0.002', 'AMMO2': '0.006', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO4': '0.029', 'HITCOUNT': '0.100', 'WEAPON5': '0.150', 'AMMO3': '0.171', 'ARMOR': '0.448', 'DAMAGECOUNT': '0.450', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.200', 'weapon2': '1.270', 'weapon3': '2.064'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:55,483][63734] DAMAGECOUNT value on done: 12027.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:55,874][63734] DAMAGECOUNT value on done: 12248.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:55,875][63734] Sum rewards: -1.135, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.046', 'AMMO2': '0.007', 'AMMO5': '0.010', 'AMMO4': '0.034', 'WEAPON1': '0.080', 'AMMO3': '0.091', 'weapon5': '0.148', 'HITCOUNT': '0.190', 'WEAPON5': '0.300', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.903', 'weapon3': '1.592', 'weapon2': '1.606', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:57,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11195.7, 300 sec: 11274.4). Total num frames: 17055744. Throughput: 0: 852.9, 1: 1954.4. Samples: 4260226. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:01:57,460][109198] Avg episode reward: [(0, '-0.894'), (1, '-2.483')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:59,300][63732] Updated weights for policy 0, policy_version 2070 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:01:59,474][63733] Updated weights for policy 1, policy_version 2100 (0.0013)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:00,691][63767] DAMAGECOUNT value on done: 14497.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:00,691][63767] Sum rewards: 2.867, reward structure: {'DEATHCOUNT': '-5.250', 'weapon4': '0.008', 'AMMO5': '0.017', 'AMMO2': '0.022', 'ARMOR': '0.036', 'WEAPON1': '0.060', 'AMMO3': '0.071', 'WEAPON4': '0.100', 'AMMO4': '0.109', 'HEALTH': '0.160', 'HITCOUNT': '0.190', 'weapon5': '0.206', 'WEAPON5': '0.350', 'WEAPON3': '0.450', 'DAMAGECOUNT': '1.155', 'weapon3': '1.586', 'weapon2': '1.596', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:01,124][63767] DAMAGECOUNT value on done: 16817.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:01,125][63767] Sum rewards: -3.633, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.616', 'weapon5': '0.002', 'AMMO2': '0.007', 'WEAPON1': '0.010', 'AMMO5': '0.013', 'AMMO4': '0.037', 'ARMOR': '0.040', 'WEAPON5': '0.150', 'AMMO3': '0.181', 'HITCOUNT': '0.220', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.005', 'weapon2': '1.300', 'weapon3': '2.118', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:02,337][63771] DAMAGECOUNT value on done: 11423.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:02,337][63771] Sum rewards: -1.119, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.527', 'AMMO5': '0.005', 'AMMO2': '0.022', 'weapon5': '0.060', 'WEAPON5': '0.100', 'ARMOR': '0.109', 'AMMO4': '0.109', 'AMMO3': '0.120', 'HITCOUNT': '0.160', 'WEAPON4': '0.300', 'weapon4': '0.344', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.717', 'weapon2': '1.564', 'weapon3': '1.698', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:02,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11127.5, 300 sec: 11274.4). Total num frames: 17108992. Throughput: 0: 847.1, 1: 1959.7. Samples: 4268554. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:02,460][109198] Avg episode reward: [(0, '-0.894'), (1, '-2.417')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:02,735][63771] DAMAGECOUNT value on done: 14140.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:02,807][63769] DAMAGECOUNT value on done: 12690.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:02,807][63769] Sum rewards: -2.725, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.896', 'AMMO2': '0.007', 'weapon5': '0.014', 'AMMO5': '0.015', 'AMMO4': '0.035', 'WEAPON1': '0.040', 'weapon7': '0.068', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.155', 'WEAPON7': '0.200', 'HITCOUNT': '0.240', 'WEAPON5': '0.300', 'ARMOR': '0.461', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.906', 'weapon2': '1.110', 'FRAGCOUNT': '2.000', 'weapon3': '2.230'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:03,132][63769] DAMAGECOUNT value on done: 11515.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:04,672][63733] Updated weights for policy 1, policy_version 2110 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:05,073][63770] DAMAGECOUNT value on done: 10884.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:05,073][63770] Sum rewards: -1.707, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.593', 'AMMO5': '0.005', 'weapon4': '0.006', 'AMMO2': '0.023', 'ARMOR': '0.024', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'AMMO4': '0.113', 'AMMO3': '0.142', 'HITCOUNT': '0.180', 'weapon5': '0.198', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.900', 'weapon2': '1.244', 'FRAGCOUNT': '2.000', 'weapon3': '2.196'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:05,473][63770] DAMAGECOUNT value on done: 13311.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:05,473][63770] Sum rewards: -2.423, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.108', 'AMMO5': '0.010', 'AMMO2': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.061', 'ARMOR': '0.088', 'weapon4': '0.092', 'AMMO3': '0.124', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'HITCOUNT': '0.250', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.041', 'weapon2': '1.638', 'weapon3': '1.848', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:07,117][63805] DAMAGECOUNT value on done: 14272.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:07,117][63805] Sum rewards: -2.396, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.426', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO2': '0.031', 'ARMOR': '0.068', 'HITCOUNT': '0.070', 'weapon5': '0.080', 'AMMO3': '0.121', 'WEAPON5': '0.150', 'AMMO4': '0.157', 'weapon4': '0.248', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.800', 'weapon2': '1.198', 'weapon3': '1.764', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:07,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11195.7, 300 sec: 11274.4). Total num frames: 17166336. Throughput: 0: 832.6, 1: 1965.9. Samples: 4285133. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:07,460][109198] Avg episode reward: [(0, '-0.886'), (1, '-2.511')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:07,515][63805] DAMAGECOUNT value on done: 15368.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:07,515][63805] Sum rewards: -5.361, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.946', 'AMMO5': '0.013', 'AMMO2': '0.014', 'WEAPON1': '0.030', 'AMMO4': '0.068', 'ARMOR': '0.072', 'weapon5': '0.124', 'AMMO3': '0.168', 'HITCOUNT': '0.210', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.585', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050', 'weapon2': '1.450', 'weapon3': '2.052'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:08,852][63806] DAMAGECOUNT value on done: 11829.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:09,226][63806] DAMAGECOUNT value on done: 12332.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:09,226][63806] Sum rewards: -2.422, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.216', 'AMMO5': '0.007', 'AMMO2': '0.022', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'weapon5': '0.054', 'weapon4': '0.076', 'AMMO4': '0.107', 'ARMOR': '0.112', 'AMMO3': '0.125', 'WEAPON5': '0.150', 'HITCOUNT': '0.360', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.020', 'weapon2': '1.590', 'weapon3': '1.840', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:09,728][63733] Updated weights for policy 1, policy_version 2120 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:10,628][63806] DAMAGECOUNT value on done: 12061.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:10,628][63806] Sum rewards: 3.656, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.034', 'AMMO5': '0.005', 'AMMO2': '0.007', 'weapon5': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.034', 'AMMO3': '0.094', 'WEAPON5': '0.100', 'ARMOR': '0.104', 'WEAPON4': '0.150', 'HITCOUNT': '0.170', 'weapon4': '0.488', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.726', 'weapon2': '1.528', 'weapon3': '1.552', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:11,080][63806] DAMAGECOUNT value on done: 12120.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:11,081][63806] Sum rewards: -4.288, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.735', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.008', 'AMMO5': '0.015', 'AMMO4': '0.037', 'ARMOR': '0.044', 'HITCOUNT': '0.110', 'weapon5': '0.116', 'AMMO3': '0.126', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.285', 'WEAPON3': '0.750', 'weapon2': '1.504', 'weapon3': '1.952'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:11,646][63735] DAMAGECOUNT value on done: 13318.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:11,646][63735] Sum rewards: -3.993, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.670', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO2': '0.020', 'HITCOUNT': '0.030', 'weapon4': '0.044', 'AMMO4': '0.102', 'AMMO3': '0.102', 'DAMAGECOUNT': '0.105', 'ARMOR': '0.120', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'weapon5': '0.232', 'WEAPON3': '0.650', 'weapon2': '1.402', 'weapon3': '1.742'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:11,979][63734] DAMAGECOUNT value on done: 14054.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:11,980][63734] Sum rewards: -0.584, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.804', 'AMMO2': '0.002', 'AMMO4': '0.012', 'AMMO5': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.035', 'weapon5': '0.046', 'AMMO3': '0.108', 'HITCOUNT': '0.200', 'WEAPON5': '0.300', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.678', 'weapon2': '1.458', 'weapon3': '1.546', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:12,004][63735] DAMAGECOUNT value on done: 9664.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:12,005][63735] Sum rewards: -0.750, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.621', 'AMMO4': '-0.012', 'AMMO2': '-0.002', 'AMMO5': '0.003', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'AMMO3': '0.063', 'HITCOUNT': '0.110', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.366', 'FRAGCOUNT': '1.000', 'weapon3': '1.054', 'weapon2': '1.438'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:12,141][63732] Updated weights for policy 0, policy_version 2080 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:12,356][63734] DAMAGECOUNT value on done: 11934.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:12,356][63734] Sum rewards: -3.324, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.226', 'AMMO5': '0.010', 'AMMO2': '0.014', 'AMMO4': '0.071', 'ARMOR': '0.100', 'weapon5': '0.126', 'WEAPON4': '0.150', 'AMMO3': '0.163', 'HITCOUNT': '0.200', 'WEAPON5': '0.250', 'weapon4': '0.334', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.113', 'weapon2': '1.452', 'weapon3': '1.518', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:12,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11195.9, 300 sec: 11274.4). Total num frames: 17223680. Throughput: 0: 824.3, 1: 1980.8. Samples: 4302204. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:12,460][109198] Avg episode reward: [(0, '-0.922'), (1, '-2.434')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:13,621][63735] DAMAGECOUNT value on done: 11189.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:13,622][63735] Sum rewards: -4.657, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.806', 'AMMO5': '0.010', 'weapon5': '0.010', 'AMMO2': '0.016', 'WEAPON1': '0.020', 'ARMOR': '0.072', 'AMMO4': '0.079', 'AMMO3': '0.119', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'HITCOUNT': '0.230', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.783', 'FRAGCOUNT': '1.000', 'weapon3': '1.198', 'weapon2': '2.262'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:14,004][63735] DAMAGECOUNT value on done: 15136.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:14,004][63735] Sum rewards: -1.960, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.660', 'AMMO4': '-0.043', 'AMMO2': '-0.009', 'WEAPON1': '0.020', 'AMMO5': '0.026', 'AMMO3': '0.131', 'weapon5': '0.170', 'HITCOUNT': '0.210', 'WEAPON5': '0.400', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.765', 'weapon3': '1.352', 'weapon2': '1.376', 'FRAGCOUNT': '1.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:14,519][63771] DAMAGECOUNT value on done: 12519.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:14,520][63771] Sum rewards: -3.133, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.896', 'AMMO2': '0.008', 'AMMO5': '0.015', 'WEAPON1': '0.030', 'AMMO4': '0.041', 'ARMOR': '0.068', 'WEAPON4': '0.100', 'weapon4': '0.136', 'weapon5': '0.138', 'AMMO3': '0.208', 'HITCOUNT': '0.240', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.819', 'WEAPON3': '0.900', 'weapon2': '1.240', 'FRAGCOUNT': '2.000', 'weapon3': '2.020'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:14,631][63769] DAMAGECOUNT value on done: 14241.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:14,632][63769] Sum rewards: -2.188, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.430', 'FRAGCOUNT': '0.000', 'weapon7': '0.004', 'AMMO2': '0.005', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.026', 'ARMOR': '0.040', 'WEAPON4': '0.100', 'AMMO3': '0.102', 'weapon4': '0.106', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon5': '0.252', 'HITCOUNT': '0.290', 'WEAPON5': '0.350', 'WEAPON3': '0.650', 'weapon2': '1.080', 'weapon3': '1.760', 'DAMAGECOUNT': '2.094'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:14,801][63733] Updated weights for policy 1, policy_version 2130 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:14,976][63771] DAMAGECOUNT value on done: 10092.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:14,976][63771] Sum rewards: -2.533, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.668', 'AMMO5': '0.023', 'AMMO2': '0.028', 'WEAPON1': '0.040', 'AMMO3': '0.064', 'AMMO4': '0.140', 'weapon4': '0.142', 'WEAPON4': '0.150', 'HITCOUNT': '0.190', 'weapon5': '0.264', 'WEAPON5': '0.350', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.630', 'FRAGCOUNT': '1.000', 'weapon3': '1.476', 'weapon2': '1.588'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:15,000][63769] DAMAGECOUNT value on done: 9723.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:15,001][63769] Sum rewards: -3.400, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.980', 'AMMO2': '0.007', 'AMMO5': '0.017', 'WEAPON1': '0.030', 'AMMO4': '0.033', 'ARMOR': '0.040', 'HITCOUNT': '0.120', 'AMMO3': '0.139', 'weapon5': '0.290', 'WEAPON5': '0.450', 'DAMAGECOUNT': '0.486', 'WEAPON3': '0.900', 'weapon2': '1.118', 'weapon3': '1.950', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:15,109][63767] DAMAGECOUNT value on done: 14296.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:15,110][63767] Sum rewards: -1.805, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.370', 'AMMO5': '0.005', 'AMMO2': '0.022', 'weapon7': '0.072', 'ARMOR': '0.096', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.108', 'AMMO3': '0.111', 'WEAPON4': '0.150', 'weapon4': '0.224', 'HITCOUNT': '0.320', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.239', 'weapon2': '1.582', 'weapon3': '1.686'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:15,496][63767] DAMAGECOUNT value on done: 13580.0\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:17,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11264.0, 300 sec: 11274.4). Total num frames: 17281024. Throughput: 0: 820.3, 1: 1985.3. Samples: 4310634. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:17,460][109198] Avg episode reward: [(0, '-0.966'), (1, '-2.457')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:18,579][63805] DAMAGECOUNT value on done: 13704.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:18,580][63805] Sum rewards: 1.712, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.482', 'AMMO5': '0.005', 'AMMO2': '0.006', 'AMMO4': '0.029', 'weapon4': '0.060', 'AMMO3': '0.095', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'ARMOR': '0.104', 'HITCOUNT': '0.260', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.065', 'weapon3': '1.332', 'weapon2': '2.188', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:18,991][63805] DAMAGECOUNT value on done: 10995.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:18,991][63805] Sum rewards: -1.159, reward structure: {'DEATHCOUNT': '-5.250', 'FRAGCOUNT': '-0.500', 'HEALTH': '-0.318', 'AMMO5': '0.006', 'AMMO2': '0.007', 'WEAPON1': '0.020', 'AMMO4': '0.034', 'WEAPON4': '0.050', 'ARMOR': '0.076', 'weapon4': '0.094', 'AMMO3': '0.098', 'weapon5': '0.148', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.522', 'WEAPON3': '0.600', 'weapon2': '1.314', 'weapon3': '1.620'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:19,563][63734] DAMAGECOUNT value on done: 12252.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:19,683][63770] DAMAGECOUNT value on done: 14558.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:19,684][63770] Sum rewards: -4.432, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.737', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.007', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO4': '0.036', 'ARMOR': '0.050', 'WEAPON4': '0.050', 'weapon5': '0.086', 'WEAPON5': '0.100', 'AMMO3': '0.121', 'HITCOUNT': '0.150', 'weapon4': '0.150', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.650', 'weapon3': '1.504', 'weapon2': '1.718'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:19,860][63733] Updated weights for policy 1, policy_version 2140 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:19,943][63734] DAMAGECOUNT value on done: 12288.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:20,103][63770] DAMAGECOUNT value on done: 10833.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:20,103][63770] Sum rewards: 1.270, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.001', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.018', 'ARMOR': '0.032', 'AMMO4': '0.088', 'WEAPON5': '0.100', 'AMMO3': '0.131', 'weapon5': '0.132', 'WEAPON4': '0.200', 'HITCOUNT': '0.260', 'weapon4': '0.374', 'WEAPON3': '0.650', 'weapon2': '0.714', 'DAMAGECOUNT': '1.155', 'FRAGCOUNT': '2.000', 'weapon3': '2.152'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:22,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11264.0, 300 sec: 11274.4). Total num frames: 17338368. Throughput: 0: 812.6, 1: 2001.6. Samples: 4327675. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:22,459][109198] Avg episode reward: [(0, '-0.945'), (1, '-2.406')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:24,146][63767] DAMAGECOUNT value on done: 14707.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:24,147][63767] Sum rewards: 0.632, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.140', 'AMMO5': '0.010', 'AMMO2': '0.013', 'AMMO4': '0.064', 'weapon5': '0.068', 'WEAPON1': '0.070', 'AMMO3': '0.079', 'HITCOUNT': '0.150', 'WEAPON5': '0.200', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.630', 'FRAGCOUNT': '1.000', 'weapon3': '1.492', 'weapon2': '1.696'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:24,530][63767] DAMAGECOUNT value on done: 17108.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:24,530][63767] Sum rewards: 0.040, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.158', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.013', 'AMMO4': '0.066', 'weapon5': '0.078', 'WEAPON4': '0.100', 'ARMOR': '0.116', 'AMMO3': '0.136', 'WEAPON5': '0.150', 'HITCOUNT': '0.260', 'weapon4': '0.362', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.873', 'weapon3': '1.150', 'weapon2': '1.524', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:24,851][63733] Updated weights for policy 1, policy_version 2150 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:24,888][63732] Updated weights for policy 0, policy_version 2090 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:26,234][63771] DAMAGECOUNT value on done: 11563.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:26,235][63771] Sum rewards: -1.880, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.140', 'AMMO5': '0.007', 'AMMO2': '0.008', 'AMMO4': '0.042', 'ARMOR': '0.052', 'weapon5': '0.066', 'weapon4': '0.078', 'HITCOUNT': '0.090', 'AMMO3': '0.106', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.600', 'weapon3': '1.406', 'weapon2': '1.584', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:26,496][63735] Large shaping reward -2.549 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.3, -100.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:26,641][63771] DAMAGECOUNT value on done: 14265.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:26,641][63771] Sum rewards: 1.121, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.952', 'AMMO5': '0.003', 'AMMO2': '0.015', 'ARMOR': '0.034', 'weapon7': '0.050', 'AMMO3': '0.060', 'AMMO4': '0.072', 'HITCOUNT': '0.110', 'weapon4': '0.154', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.375', 'weapon3': '1.018', 'weapon2': '1.662', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:27,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11332.3, 300 sec: 11274.4). Total num frames: 17395712. Throughput: 0: 803.8, 1: 2013.0. Samples: 4344703. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:27,460][109198] Avg episode reward: [(0, '-0.945'), (1, '-2.247')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:27,466][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000002155_8826880.pth...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:27,466][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002092_8568832.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:27,526][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001741_7131136.pth\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:27,527][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001846_7561216.pth\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:27,534][63576] Saving new best policy, reward=-2.247!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:27,663][63769] DAMAGECOUNT value on done: 13249.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:27,663][63769] Sum rewards: -0.348, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.476', 'AMMO2': '0.002', 'AMMO4': '0.008', 'AMMO5': '0.027', 'WEAPON1': '0.040', 'AMMO3': '0.147', 'weapon5': '0.296', 'HITCOUNT': '0.340', 'WEAPON5': '0.550', 'WEAPON3': '0.750', 'weapon2': '1.442', 'DAMAGECOUNT': '1.677', 'weapon3': '1.848', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:28,088][63769] DAMAGECOUNT value on done: 11850.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:28,088][63769] Sum rewards: -1.230, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.100', 'AMMO2': '0.014', 'AMMO5': '0.015', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'weapon4': '0.050', 'AMMO4': '0.072', 'ARMOR': '0.088', 'AMMO3': '0.098', 'weapon5': '0.102', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'WEAPON3': '0.450', 'DAMAGECOUNT': '1.005', 'weapon3': '1.426', 'FRAGCOUNT': '1.500', 'weapon2': '1.750'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:29,001][63770] DAMAGECOUNT value on done: 10954.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:29,378][63770] DAMAGECOUNT value on done: 13608.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:29,378][63770] Sum rewards: -1.957, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.760', 'AMMO2': '0.004', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'ARMOR': '0.016', 'AMMO4': '0.022', 'weapon5': '0.040', 'WEAPON5': '0.050', 'AMMO3': '0.164', 'HITCOUNT': '0.260', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.891', 'weapon3': '1.470', 'weapon2': '1.918', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:29,917][63733] Updated weights for policy 1, policy_version 2160 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:30,651][63805] DAMAGECOUNT value on done: 14307.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:31,047][63805] DAMAGECOUNT value on done: 15623.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:31,048][63805] Sum rewards: -6.425, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.926', 'AMMO2': '0.008', 'AMMO4': '0.039', 'WEAPON4': '0.100', 'AMMO3': '0.159', 'HITCOUNT': '0.190', 'weapon4': '0.244', 'ARMOR': '0.588', 'DAMAGECOUNT': '0.765', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.390', 'weapon3': '1.468'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:32,069][63806] DAMAGECOUNT value on done: 11994.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:32,070][63806] Sum rewards: -10.252, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-3.680', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'AMMO5': '0.020', 'weapon5': '0.028', 'ARMOR': '0.092', 'HITCOUNT': '0.170', 'AMMO3': '0.236', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.495', 'FRAGCOUNT': '1.000', 'weapon2': '1.226', 'WEAPON3': '1.400', 'weapon3': '1.992'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:32,388][63806] DAMAGECOUNT value on done: 12417.0\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:32,458][109198] Fps is (10 sec: 10649.5, 60 sec: 11195.7, 300 sec: 11260.5). Total num frames: 17444864. Throughput: 0: 801.5, 1: 2015.4. Samples: 4353157. Policy #0 lag: (min: 0.0, avg: 0.1, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:32,460][109198] Avg episode reward: [(0, '-0.948'), (1, '-2.433')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:34,011][63734] DAMAGECOUNT value on done: 14559.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:34,012][63734] Sum rewards: 4.967, reward structure: {'DEATHCOUNT': '-4.500', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.013', 'ARMOR': '0.036', 'AMMO4': '0.064', 'AMMO3': '0.077', 'HEALTH': '0.144', 'WEAPON5': '0.150', 'HITCOUNT': '0.150', 'weapon5': '0.166', 'WEAPON3': '0.300', 'weapon2': '1.388', 'weapon3': '1.446', 'DAMAGECOUNT': '1.515', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:34,375][63734] DAMAGECOUNT value on done: 12638.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:34,376][63734] Sum rewards: -1.896, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.572', 'weapon7': '0.008', 'AMMO2': '0.010', 'AMMO5': '0.014', 'AMMO4': '0.052', 'ARMOR': '0.068', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.144', 'AMMO3': '0.190', 'weapon5': '0.204', 'WEAPON5': '0.350', 'HITCOUNT': '0.480', 'weapon2': '1.036', 'WEAPON3': '1.150', 'DAMAGECOUNT': '2.112', 'weapon3': '2.208', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:34,834][63806] DAMAGECOUNT value on done: 12243.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:34,834][63806] Sum rewards: -9.430, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-2.327', 'AMMO5': '0.007', 'AMMO2': '0.019', 'WEAPON1': '0.020', 'weapon4': '0.052', 'AMMO4': '0.094', 'HITCOUNT': '0.130', 'WEAPON5': '0.150', 'AMMO3': '0.177', 'WEAPON4': '0.250', 'ARMOR': '0.497', 'DAMAGECOUNT': '0.546', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.494', 'weapon3': '1.760'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:35,014][63733] Updated weights for policy 1, policy_version 2170 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:35,196][63735] DAMAGECOUNT value on done: 13613.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:35,196][63735] Sum rewards: -0.227, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.569', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.022', 'WEAPON5': '0.050', 'ARMOR': '0.056', 'weapon4': '0.066', 'AMMO3': '0.099', 'WEAPON4': '0.100', 'AMMO4': '0.109', 'HITCOUNT': '0.210', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.885', 'FRAGCOUNT': '1.000', 'weapon2': '1.538', 'weapon3': '1.644'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:35,205][63806] DAMAGECOUNT value on done: 12461.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:35,205][63806] Sum rewards: -2.540, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.051', 'AMMO2': '0.014', 'AMMO5': '0.015', 'ARMOR': '0.016', 'WEAPON1': '0.030', 'AMMO4': '0.068', 'WEAPON4': '0.100', 'AMMO3': '0.112', 'weapon4': '0.116', 'HITCOUNT': '0.170', 'weapon5': '0.260', 'WEAPON5': '0.350', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.951', 'weapon2': '1.484', 'weapon3': '1.824'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:35,576][63735] DAMAGECOUNT value on done: 9779.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:35,576][63735] Sum rewards: -3.141, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.026', 'AMMO5': '0.005', 'AMMO2': '0.007', 'weapon5': '0.010', 'WEAPON1': '0.020', 'AMMO4': '0.034', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.132', 'ARMOR': '0.148', 'WEAPON4': '0.150', 'weapon4': '0.204', 'DAMAGECOUNT': '0.345', 'WEAPON3': '0.700', 'weapon3': '1.426', 'weapon2': '1.494', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:36,577][63769] DAMAGECOUNT value on done: 14424.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:36,577][63769] Sum rewards: -1.374, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.140', 'AMMO2': '0.005', 'weapon4': '0.016', 'AMMO5': '0.017', 'AMMO4': '0.023', 'WEAPON1': '0.030', 'ARMOR': '0.030', 'WEAPON4': '0.100', 'AMMO3': '0.144', 'HITCOUNT': '0.190', 'weapon5': '0.250', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.549', 'WEAPON3': '0.850', 'weapon2': '1.132', 'weapon3': '2.080', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:36,890][63769] DAMAGECOUNT value on done: 9943.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:36,890][63769] Sum rewards: 0.297, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO5': '0.005', 'AMMO2': '0.021', 'WEAPON4': '0.050', 'WEAPON5': '0.050', 'weapon5': '0.092', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO4': '0.103', 'AMMO3': '0.118', 'weapon7': '0.122', 'weapon4': '0.204', 'HITCOUNT': '0.210', 'HEALTH': '0.228', 'ARMOR': '0.424', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.660', 'weapon2': '1.152', 'weapon3': '1.358', 'FRAGCOUNT': '1.500'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:37,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11264.0, 300 sec: 11274.4). Total num frames: 17506304. Throughput: 0: 804.1, 1: 2017.6. Samples: 4370339. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:37,460][109198] Avg episode reward: [(0, '-0.948'), (1, '-2.580')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:37,472][63732] Updated weights for policy 0, policy_version 2100 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:37,944][63735] DAMAGECOUNT value on done: 11426.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:37,945][63735] Sum rewards: -1.696, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.904', 'AMMO2': '0.001', 'AMMO5': '0.004', 'AMMO4': '0.006', 'ARMOR': '0.040', 'weapon5': '0.044', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.140', 'HITCOUNT': '0.150', 'weapon4': '0.240', 'DAMAGECOUNT': '0.711', 'WEAPON3': '0.800', 'weapon2': '0.964', 'weapon3': '1.908', 'FRAGCOUNT': '2.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:38,348][63735] DAMAGECOUNT value on done: 15301.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:38,348][63735] Sum rewards: -1.909, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.797', 'AMMO4': '-0.030', 'AMMO2': '-0.006', 'WEAPON4': '0.050', 'ARMOR': '0.080', 'AMMO3': '0.115', 'HITCOUNT': '0.190', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.354', 'weapon3': '1.840'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:38,847][63767] DAMAGECOUNT value on done: 14448.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:39,237][63767] DAMAGECOUNT value on done: 13784.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:39,238][63767] Sum rewards: -4.448, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.732', 'weapon5': '0.002', 'AMMO5': '0.003', 'AMMO2': '0.017', 'ARMOR': '0.036', 'WEAPON5': '0.050', 'weapon4': '0.056', 'AMMO4': '0.083', 'AMMO3': '0.136', 'HITCOUNT': '0.160', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.612', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.102', 'weapon3': '1.928'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:39,369][63771] DAMAGECOUNT value on done: 12852.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:39,369][63771] Sum rewards: -4.008, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.812', 'AMMO2': '0.005', 'AMMO5': '0.008', 'WEAPON1': '0.010', 'weapon5': '0.026', 'AMMO4': '0.026', 'ARMOR': '0.051', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'AMMO3': '0.151', 'weapon4': '0.152', 'HITCOUNT': '0.320', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.999', 'weapon2': '1.620', 'weapon3': '1.736', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:39,756][63771] DAMAGECOUNT value on done: 10112.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:39,756][63771] Sum rewards: -5.713, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.724', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'AMMO5': '0.018', 'HITCOUNT': '0.020', 'ARMOR': '0.032', 'AMMO4': '0.054', 'DAMAGECOUNT': '0.060', 'AMMO3': '0.130', 'WEAPON5': '0.300', 'weapon5': '0.388', 'WEAPON3': '0.700', 'weapon2': '1.436', 'weapon3': '1.602'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:40,055][63733] Updated weights for policy 1, policy_version 2180 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:42,058][63805] DAMAGECOUNT value on done: 13876.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:42,059][63805] Sum rewards: -0.263, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.414', 'AMMO2': '0.005', 'WEAPON1': '0.010', 'AMMO4': '0.027', 'AMMO3': '0.092', 'HITCOUNT': '0.140', 'ARMOR': '0.497', 'DAMAGECOUNT': '0.516', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.582', 'weapon2': '1.732'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:42,409][63805] DAMAGECOUNT value on done: 11155.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:42,410][63805] Sum rewards: -4.815, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.290', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'ARMOR': '0.024', 'weapon4': '0.032', 'weapon5': '0.032', 'AMMO2': '0.040', 'WEAPON5': '0.050', 'HITCOUNT': '0.120', 'AMMO3': '0.135', 'AMMO4': '0.199', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.480', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.442', 'weapon3': '1.708'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:42,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11264.0, 300 sec: 11260.5). Total num frames: 17559552. Throughput: 0: 804.3, 1: 2016.8. Samples: 4387176. Policy #0 lag: (min: 0.0, avg: 0.1, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:42,460][109198] Avg episode reward: [(0, '-1.037'), (1, '-2.677')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:43,375][63734] DAMAGECOUNT value on done: 12568.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:43,376][63734] Sum rewards: -0.781, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.317', 'weapon5': '0.002', 'AMMO5': '0.007', 'AMMO2': '0.016', 'WEAPON1': '0.020', 'weapon4': '0.052', 'AMMO4': '0.080', 'AMMO3': '0.114', 'ARMOR': '0.116', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'HITCOUNT': '0.240', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.948', 'weapon2': '1.424', 'weapon3': '1.816', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:43,759][63734] DAMAGECOUNT value on done: 12470.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:43,760][63734] Sum rewards: -0.756, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.792', 'AMMO4': '-0.006', 'AMMO2': '-0.001', 'weapon5': '0.002', 'AMMO5': '0.005', 'weapon4': '0.012', 'WEAPON4': '0.050', 'AMMO3': '0.098', 'WEAPON5': '0.100', 'ARMOR': '0.104', 'HITCOUNT': '0.110', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.546', 'weapon3': '1.566', 'weapon2': '1.700', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:44,697][63770] DAMAGECOUNT value on done: 14698.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:44,697][63770] Sum rewards: -8.123, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-2.107', 'WEAPON1': '0.010', 'AMMO5': '0.010', 'AMMO2': '0.019', 'ARMOR': '0.060', 'weapon5': '0.086', 'AMMO4': '0.095', 'weapon4': '0.124', 'HITCOUNT': '0.130', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'AMMO3': '0.156', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.900', 'weapon3': '1.284', 'weapon2': '1.890', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:45,042][63770] DAMAGECOUNT value on done: 11168.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:45,043][63770] Sum rewards: 2.220, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.035', 'AMMO4': '-0.003', 'AMMO2': '-0.001', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO3': '0.093', 'WEAPON4': '0.100', 'weapon5': '0.158', 'HITCOUNT': '0.190', 'weapon4': '0.198', 'WEAPON5': '0.200', 'ARMOR': '0.511', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.005', 'weapon2': '1.294', 'weapon3': '1.640', 'FRAGCOUNT': '2.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:45,141][63733] Updated weights for policy 1, policy_version 2190 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:47,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11264.0, 300 sec: 11260.5). Total num frames: 17616896. Throughput: 0: 806.7, 1: 2016.7. Samples: 4395605. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:47,460][109198] Avg episode reward: [(0, '-1.036'), (1, '-2.656')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:48,249][63767] DAMAGECOUNT value on done: 14911.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:48,249][63767] Sum rewards: -2.253, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.322', 'AMMO4': '-0.021', 'AMMO2': '-0.004', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'WEAPON5': '0.100', 'ARMOR': '0.104', 'AMMO3': '0.133', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.612', 'WEAPON3': '0.850', 'weapon2': '1.578', 'weapon3': '1.772', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:48,606][63767] DAMAGECOUNT value on done: 17413.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:48,607][63767] Sum rewards: -0.090, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.500', 'AMMO2': '0.005', 'WEAPON1': '0.010', 'AMMO4': '0.025', 'WEAPON4': '0.050', 'ARMOR': '0.072', 'AMMO3': '0.079', 'weapon4': '0.104', 'HITCOUNT': '0.270', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.915', 'weapon2': '1.482', 'weapon3': '1.598', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:50,284][63733] Updated weights for policy 1, policy_version 2200 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:50,305][63732] Updated weights for policy 0, policy_version 2110 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:50,390][63771] DAMAGECOUNT value on done: 11778.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:50,391][63771] Sum rewards: -0.304, reward structure: {'DEATHCOUNT': '-6.750', 'weapon5': '0.006', 'AMMO5': '0.007', 'AMMO2': '0.010', 'AMMO4': '0.049', 'AMMO3': '0.070', 'WEAPON4': '0.100', 'weapon4': '0.132', 'ARMOR': '0.139', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'WEAPON3': '0.350', 'HEALTH': '0.606', 'DAMAGECOUNT': '0.645', 'FRAGCOUNT': '1.000', 'weapon3': '1.510', 'weapon2': '1.522'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:50,779][63771] DAMAGECOUNT value on done: 14530.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:50,780][63771] Sum rewards: -4.145, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.749', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.014', 'ARMOR': '0.053', 'AMMO4': '0.069', 'weapon4': '0.072', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.125', 'HITCOUNT': '0.210', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.795', 'FRAGCOUNT': '1.000', 'weapon2': '1.620', 'weapon3': '1.678'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:52,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11264.0, 300 sec: 11260.5). Total num frames: 17674240. Throughput: 0: 808.4, 1: 2022.3. Samples: 4412516. Policy #0 lag: (min: 0.0, avg: 0.1, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:52,460][109198] Avg episode reward: [(0, '-1.036'), (1, '-2.592')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:52,579][63769] DAMAGECOUNT value on done: 13374.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:52,580][63769] Sum rewards: -4.922, reward structure: {'DEATHCOUNT': '-10.500', 'FRAGCOUNT': '-0.500', 'WEAPON1': '0.010', 'AMMO5': '0.017', 'ARMOR': '0.020', 'AMMO2': '0.031', 'weapon7': '0.064', 'HITCOUNT': '0.080', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon4': '0.120', 'AMMO3': '0.131', 'weapon5': '0.146', 'WEAPON4': '0.150', 'AMMO4': '0.153', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.375', 'HEALTH': '0.420', 'WEAPON3': '0.650', 'weapon2': '1.174', 'weapon3': '1.936'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:53,024][63769] DAMAGECOUNT value on done: 12095.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:53,024][63769] Sum rewards: -3.861, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.424', 'AMMO5': '0.003', 'weapon5': '0.006', 'AMMO2': '0.019', 'WEAPON5': '0.050', 'ARMOR': '0.080', 'AMMO4': '0.093', 'weapon4': '0.096', 'AMMO3': '0.159', 'WEAPON4': '0.200', 'HITCOUNT': '0.230', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.735', 'FRAGCOUNT': '1.000', 'weapon2': '1.298', 'weapon3': '1.644'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:53,054][63770] DAMAGECOUNT value on done: 11097.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:53,054][63770] Sum rewards: 1.323, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-1.152', 'AMMO2': '0.007', 'AMMO5': '0.013', 'ARMOR': '0.036', 'AMMO4': '0.037', 'WEAPON4': '0.050', 'AMMO3': '0.060', 'weapon4': '0.068', 'HITCOUNT': '0.090', 'weapon7': '0.104', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON7': '0.200', 'WEAPON5': '0.250', 'weapon5': '0.326', 'DAMAGECOUNT': '0.429', 'WEAPON3': '0.450', 'weapon3': '1.094', 'weapon2': '1.520', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:53,440][63770] DAMAGECOUNT value on done: 13760.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:54,088][63805] DAMAGECOUNT value on done: 14502.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:54,089][63805] Sum rewards: 0.488, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.346', 'WEAPON1': '0.010', 'AMMO5': '0.013', 'AMMO2': '0.018', 'weapon4': '0.040', 'weapon5': '0.078', 'AMMO4': '0.087', 'WEAPON4': '0.100', 'AMMO3': '0.115', 'HITCOUNT': '0.190', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.585', 'ARMOR': '0.588', 'WEAPON3': '0.650', 'weapon2': '1.330', 'weapon3': '1.530', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:54,483][63805] DAMAGECOUNT value on done: 15763.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:54,484][63805] Sum rewards: -1.960, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.261', 'AMMO2': '0.026', 'weapon4': '0.036', 'AMMO4': '0.128', 'AMMO3': '0.139', 'HITCOUNT': '0.140', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.420', 'ARMOR': '0.490', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.694', 'weapon2': '1.778'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:55,345][63733] Updated weights for policy 1, policy_version 2210 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:55,560][63806] DAMAGECOUNT value on done: 12469.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:55,560][63806] Sum rewards: -2.427, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.733', 'AMMO5': '0.007', 'AMMO2': '0.008', 'ARMOR': '0.024', 'AMMO4': '0.042', 'WEAPON5': '0.100', 'AMMO3': '0.175', 'HITCOUNT': '0.380', 'WEAPON3': '1.000', 'DAMAGECOUNT': '1.425', 'weapon2': '1.444', 'weapon3': '1.950', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:55,895][63734] DAMAGECOUNT value on done: 14843.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:55,896][63734] Sum rewards: 2.862, reward structure: {'DEATHCOUNT': '-3.750', 'HEALTH': '-0.441', 'AMMO5': '0.003', 'AMMO2': '0.011', 'weapon4': '0.030', 'WEAPON5': '0.050', 'AMMO4': '0.053', 'weapon5': '0.062', 'ARMOR': '0.064', 'WEAPON4': '0.100', 'AMMO3': '0.122', 'HITCOUNT': '0.210', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.852', 'weapon2': '1.168', 'weapon3': '1.878', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:55,960][63806] DAMAGECOUNT value on done: 12762.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:55,960][63806] Sum rewards: -1.761, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.006', 'weapon5': '0.004', 'AMMO2': '0.005', 'AMMO5': '0.020', 'AMMO4': '0.026', 'ARMOR': '0.068', 'WEAPON4': '0.150', 'AMMO3': '0.155', 'WEAPON5': '0.200', 'weapon4': '0.214', 'HITCOUNT': '0.290', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.035', 'weapon2': '1.418', 'weapon3': '1.760', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:56,214][63734] DAMAGECOUNT value on done: 12808.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:56,215][63734] Sum rewards: -0.850, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.955', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'weapon7': '0.054', 'weapon5': '0.072', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.140', 'weapon4': '0.158', 'HITCOUNT': '0.170', 'WEAPON7': '0.200', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.402', 'weapon3': '1.670'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:57,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11264.0, 300 sec: 11260.5). Total num frames: 17731584. Throughput: 0: 806.0, 1: 2019.5. Samples: 4429354. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:02:57,459][109198] Avg episode reward: [(0, '-1.020'), (1, '-2.564')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:58,830][63769] DAMAGECOUNT value on done: 14693.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:58,831][63769] Sum rewards: -0.621, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.472', 'AMMO5': '0.005', 'AMMO2': '0.012', 'ARMOR': '0.044', 'WEAPON5': '0.050', 'AMMO4': '0.062', 'weapon5': '0.106', 'AMMO3': '0.121', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'weapon4': '0.272', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.807', 'weapon2': '1.350', 'weapon3': '1.452', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:58,974][63735] DAMAGECOUNT value on done: 13878.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:58,975][63735] Sum rewards: -2.380, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.786', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'weapon5': '0.010', 'AMMO2': '0.045', 'WEAPON5': '0.050', 'AMMO3': '0.135', 'ARMOR': '0.135', 'HITCOUNT': '0.190', 'AMMO4': '0.227', 'weapon4': '0.256', 'WEAPON4': '0.450', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.795', 'weapon2': '1.248', 'weapon3': '1.652', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:59,193][63769] DAMAGECOUNT value on done: 10398.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:59,193][63769] Sum rewards: 2.731, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.726', 'AMMO5': '0.007', 'AMMO2': '0.026', 'ARMOR': '0.036', 'WEAPON1': '0.040', 'WEAPON4': '0.050', 'weapon7': '0.090', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon4': '0.110', 'HITCOUNT': '0.120', 'AMMO3': '0.127', 'AMMO4': '0.128', 'WEAPON5': '0.200', 'weapon5': '0.206', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.909', 'weapon2': '1.150', 'weapon3': '1.658', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:59,299][63735] DAMAGECOUNT value on done: 10024.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:59,300][63735] Sum rewards: -0.880, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.240', 'AMMO4': '-0.028', 'AMMO2': '-0.006', 'ARMOR': '0.020', 'AMMO3': '0.122', 'HITCOUNT': '0.180', 'DAMAGECOUNT': '0.735', 'WEAPON3': '0.850', 'weapon2': '1.178', 'weapon3': '2.058', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:59,442][63806] DAMAGECOUNT value on done: 12333.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:59,779][63806] DAMAGECOUNT value on done: 12721.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:02:59,779][63806] Sum rewards: -3.862, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.161', 'AMMO5': '0.005', 'AMMO2': '0.009', 'weapon5': '0.020', 'AMMO4': '0.045', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'ARMOR': '0.132', 'AMMO3': '0.140', 'HITCOUNT': '0.260', 'weapon4': '0.348', 'DAMAGECOUNT': '0.780', 'WEAPON3': '0.950', 'weapon2': '1.344', 'weapon3': '1.816', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:00,429][63733] Updated weights for policy 1, policy_version 2220 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:02,458][109198] Fps is (10 sec: 11468.5, 60 sec: 11332.2, 300 sec: 11260.5). Total num frames: 17788928. Throughput: 0: 806.0, 1: 2019.3. Samples: 4437775. Policy #0 lag: (min: 0.0, avg: 0.1, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:02,460][109198] Avg episode reward: [(0, '-0.894'), (1, '-2.483')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:02,537][63767] DAMAGECOUNT value on done: 14518.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:02,537][63767] Sum rewards: -1.573, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.729', 'AMMO2': '0.001', 'AMMO5': '0.005', 'AMMO4': '0.005', 'WEAPON1': '0.020', 'weapon4': '0.026', 'weapon5': '0.040', 'WEAPON4': '0.050', 'HITCOUNT': '0.070', 'ARMOR': '0.077', 'WEAPON5': '0.100', 'AMMO3': '0.105', 'DAMAGECOUNT': '0.210', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.262', 'weapon2': '1.534'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:02,653][63735] DAMAGECOUNT value on done: 11633.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:02,653][63735] Sum rewards: -0.473, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.770', 'AMMO2': '0.012', 'AMMO4': '0.061', 'ARMOR': '0.116', 'AMMO3': '0.119', 'WEAPON4': '0.150', 'HITCOUNT': '0.200', 'weapon4': '0.388', 'DAMAGECOUNT': '0.621', 'WEAPON3': '0.700', 'weapon3': '1.252', 'weapon2': '1.428', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:02,838][63767] DAMAGECOUNT value on done: 13929.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:02,838][63767] Sum rewards: -0.701, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO5': '0.007', 'AMMO2': '0.009', 'WEAPON1': '0.010', 'weapon5': '0.038', 'AMMO4': '0.046', 'weapon4': '0.078', 'WEAPON4': '0.100', 'weapon7': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.115', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON5': '0.150', 'WEAPON7': '0.200', 'HEALTH': '0.264', 'ARMOR': '0.400', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.450', 'weapon2': '1.546'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:02,997][63732] Updated weights for policy 0, policy_version 2120 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:03,064][63735] DAMAGECOUNT value on done: 15791.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:03,064][63735] Sum rewards: -1.221, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.054', 'AMMO5': '0.013', 'AMMO2': '0.017', 'ARMOR': '0.044', 'weapon5': '0.070', 'AMMO4': '0.082', 'WEAPON4': '0.100', 'AMMO3': '0.151', 'WEAPON5': '0.200', 'weapon4': '0.234', 'HITCOUNT': '0.330', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.470', 'weapon3': '1.672', 'weapon2': '1.700', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:04,205][63771] DAMAGECOUNT value on done: 13233.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:04,205][63771] Sum rewards: -2.580, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.849', 'AMMO4': '-0.024', 'AMMO2': '-0.005', 'FRAGCOUNT': '0.000', 'AMMO5': '0.019', 'AMMO3': '0.103', 'weapon5': '0.172', 'HITCOUNT': '0.310', 'WEAPON5': '0.350', 'WEAPON3': '0.500', 'ARMOR': '0.532', 'DAMAGECOUNT': '1.143', 'weapon2': '1.588', 'weapon3': '1.830'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:04,669][63771] DAMAGECOUNT value on done: 10399.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:04,670][63771] Sum rewards: -3.080, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.815', 'AMMO4': '-0.003', 'AMMO2': '-0.001', 'AMMO5': '0.010', 'weapon5': '0.032', 'AMMO3': '0.139', 'WEAPON5': '0.150', 'HITCOUNT': '0.250', 'ARMOR': '0.531', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.861', 'weapon2': '1.528', 'weapon3': '1.888', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:05,533][63733] Updated weights for policy 1, policy_version 2230 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:05,740][63805] DAMAGECOUNT value on done: 13891.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:06,125][63805] DAMAGECOUNT value on done: 11478.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:06,125][63805] Sum rewards: -3.120, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.110', 'weapon4': '0.002', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'ARMOR': '0.044', 'WEAPON5': '0.050', 'AMMO4': '0.084', 'WEAPON4': '0.100', 'weapon5': '0.104', 'AMMO3': '0.114', 'HITCOUNT': '0.290', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.969', 'weapon3': '1.512', 'weapon2': '1.742', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:07,242][63734] DAMAGECOUNT value on done: 12850.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:07,243][63734] Sum rewards: -1.414, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.068', 'AMMO2': '0.004', 'AMMO4': '0.021', 'ARMOR': '0.040', 'AMMO3': '0.093', 'HITCOUNT': '0.200', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.846', 'weapon3': '1.648', 'weapon2': '1.702', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:07,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11264.0, 300 sec: 11260.5). Total num frames: 17842176. Throughput: 0: 805.6, 1: 2017.1. Samples: 4454699. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:07,460][109198] Avg episode reward: [(0, '-0.954'), (1, '-2.477')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:07,667][63734] DAMAGECOUNT value on done: 12575.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:07,668][63734] Sum rewards: 0.494, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-1.400', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'ARMOR': '0.072', 'HITCOUNT': '0.080', 'AMMO3': '0.087', 'WEAPON4': '0.100', 'weapon4': '0.182', 'weapon5': '0.252', 'DAMAGECOUNT': '0.315', 'WEAPON5': '0.350', 'WEAPON3': '0.550', 'weapon3': '0.938', 'weapon2': '1.460', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:09,740][63770] DAMAGECOUNT value on done: 14918.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:09,740][63770] Sum rewards: -5.115, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.631', 'weapon4': '0.002', 'AMMO2': '0.011', 'AMMO5': '0.017', 'ARMOR': '0.040', 'WEAPON1': '0.040', 'WEAPON4': '0.050', 'AMMO4': '0.056', 'AMMO3': '0.167', 'HITCOUNT': '0.170', 'weapon5': '0.214', 'WEAPON5': '0.250', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.660', 'WEAPON3': '1.000', 'weapon2': '1.024', 'weapon3': '2.064'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:10,069][63770] DAMAGECOUNT value on done: 11697.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:10,070][63770] Sum rewards: 0.471, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.748', 'AMMO4': '-0.002', 'AMMO2': '-0.000', 'AMMO5': '0.014', 'weapon5': '0.090', 'WEAPON5': '0.100', 'ARMOR': '0.108', 'AMMO3': '0.158', 'WEAPON4': '0.200', 'weapon4': '0.216', 'HITCOUNT': '0.250', 'WEAPON3': '0.900', 'weapon2': '1.156', 'DAMAGECOUNT': '1.587', 'weapon3': '2.192', 'FRAGCOUNT': '3.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:10,724][63733] Updated weights for policy 1, policy_version 2240 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:11,854][63767] DAMAGECOUNT value on done: 15191.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:11,855][63767] Sum rewards: -1.637, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.577', 'AMMO4': '-0.013', 'AMMO2': '-0.003', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'ARMOR': '0.032', 'weapon5': '0.070', 'weapon7': '0.078', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.170', 'HITCOUNT': '0.210', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.840', 'weapon2': '1.552', 'weapon3': '1.638', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:12,222][63767] DAMAGECOUNT value on done: 17592.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:12,223][63767] Sum rewards: -5.589, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.459', 'AMMO2': '0.000', 'AMMO4': '0.002', 'AMMO5': '0.003', 'ARMOR': '0.020', 'WEAPON5': '0.050', 'weapon5': '0.074', 'HITCOUNT': '0.150', 'AMMO3': '0.162', 'DAMAGECOUNT': '0.537', 'WEAPON3': '1.050', 'weapon2': '1.260', 'FRAGCOUNT': '2.000', 'weapon3': '2.062'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:12,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11264.0, 300 sec: 11246.6). Total num frames: 17899520. Throughput: 0: 802.2, 1: 2007.6. Samples: 4471146. Policy #0 lag: (min: 0.0, avg: 0.1, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:12,460][109198] Avg episode reward: [(0, '-0.948'), (1, '-2.460')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:14,566][63771] DAMAGECOUNT value on done: 11912.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:14,567][63771] Sum rewards: -6.116, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.414', 'AMMO2': '0.005', 'WEAPON1': '0.010', 'AMMO5': '0.018', 'AMMO4': '0.024', 'ARMOR': '0.032', 'weapon4': '0.046', 'WEAPON4': '0.100', 'AMMO3': '0.112', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'weapon5': '0.280', 'DAMAGECOUNT': '0.402', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.214', 'weapon2': '1.846'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:14,985][63771] DAMAGECOUNT value on done: 14712.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:14,985][63771] Sum rewards: -4.153, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.758', 'AMMO5': '0.005', 'weapon5': '0.006', 'AMMO2': '0.010', 'AMMO4': '0.050', 'ARMOR': '0.068', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.124', 'AMMO3': '0.141', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.546', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.434', 'weapon3': '1.750'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:15,871][63733] Updated weights for policy 1, policy_version 2250 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:15,881][63732] Updated weights for policy 0, policy_version 2130 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:17,280][63770] DAMAGECOUNT value on done: 11287.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:17,281][63770] Sum rewards: -0.578, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.245', 'AMMO2': '0.007', 'AMMO5': '0.013', 'AMMO4': '0.035', 'WEAPON1': '0.050', 'ARMOR': '0.100', 'AMMO3': '0.106', 'HITCOUNT': '0.170', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.570', 'weapon5': '0.634', 'WEAPON3': '0.700', 'weapon2': '1.086', 'weapon3': '1.696', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:17,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11264.0, 300 sec: 11260.5). Total num frames: 17956864. Throughput: 0: 804.5, 1: 2006.5. Samples: 4479650. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:17,460][109198] Avg episode reward: [(0, '-0.948'), (1, '-2.517')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:17,564][63769] DAMAGECOUNT value on done: 13879.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:17,565][63769] Sum rewards: 1.929, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.398', 'AMMO5': '0.015', 'AMMO2': '0.018', 'ARMOR': '0.020', 'weapon7': '0.026', 'WEAPON1': '0.040', 'weapon5': '0.070', 'AMMO4': '0.089', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.120', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'weapon4': '0.312', 'HITCOUNT': '0.370', 'WEAPON3': '0.700', 'weapon2': '1.084', 'DAMAGECOUNT': '1.515', 'weapon3': '1.948', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:17,683][63770] DAMAGECOUNT value on done: 13891.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:17,957][63769] DAMAGECOUNT value on done: 12175.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:17,958][63769] Sum rewards: -3.773, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.690', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'AMMO5': '0.005', 'weapon5': '0.006', 'WEAPON1': '0.050', 'HITCOUNT': '0.090', 'AMMO3': '0.093', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.240', 'ARMOR': '0.456', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.730', 'weapon2': '1.828'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:17,968][63805] DAMAGECOUNT value on done: 14726.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:17,969][63805] Sum rewards: -5.343, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.495', 'AMMO2': '0.009', 'AMMO5': '0.011', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'AMMO4': '0.044', 'WEAPON4': '0.050', 'weapon5': '0.058', 'HITCOUNT': '0.160', 'AMMO3': '0.166', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.672', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.432', 'weapon3': '1.894'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:18,204][63734] DAMAGECOUNT value on done: 15323.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:18,205][63734] Sum rewards: 2.684, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.156', 'AMMO5': '0.007', 'AMMO2': '0.010', 'WEAPON1': '0.010', 'AMMO4': '0.048', 'ARMOR': '0.064', 'WEAPON4': '0.100', 'AMMO3': '0.103', 'WEAPON5': '0.150', 'weapon4': '0.194', 'HITCOUNT': '0.210', 'weapon5': '0.250', 'WEAPON3': '0.500', 'DAMAGECOUNT': '1.440', 'weapon2': '1.494', 'weapon3': '1.510', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:18,340][63805] DAMAGECOUNT value on done: 15963.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:18,340][63805] Sum rewards: -3.700, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.955', 'ARMOR': '0.012', 'AMMO2': '0.012', 'AMMO5': '0.013', 'WEAPON1': '0.040', 'AMMO4': '0.061', 'weapon4': '0.102', 'AMMO3': '0.127', 'HITCOUNT': '0.160', 'WEAPON4': '0.200', 'WEAPON6': '0.200', 'AMMO6': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.250', 'weapon5': '0.256', 'DAMAGECOUNT': '0.600', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon3': '1.448', 'weapon2': '1.524'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:18,587][63734] DAMAGECOUNT value on done: 12965.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:19,664][63806] DAMAGECOUNT value on done: 12759.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:19,664][63806] Sum rewards: -2.251, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.954', 'weapon4': '0.002', 'weapon5': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.013', 'ARMOR': '0.040', 'AMMO4': '0.065', 'WEAPON4': '0.100', 'AMMO3': '0.180', 'WEAPON5': '0.200', 'HITCOUNT': '0.230', 'DAMAGECOUNT': '0.870', 'WEAPON3': '1.050', 'weapon2': '1.764', 'weapon3': '1.920', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:20,037][63806] DAMAGECOUNT value on done: 13107.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:20,038][63806] Sum rewards: 0.978, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.247', 'AMMO5': '0.006', 'AMMO2': '0.017', 'ARMOR': '0.024', 'WEAPON1': '0.040', 'WEAPON4': '0.050', 'weapon4': '0.050', 'weapon5': '0.066', 'AMMO4': '0.084', 'AMMO3': '0.097', 'WEAPON5': '0.150', 'HITCOUNT': '0.250', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.035', 'weapon2': '1.382', 'weapon3': '1.774', 'FRAGCOUNT': '2.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:20,926][63733] Updated weights for policy 1, policy_version 2260 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:21,039][63769] DAMAGECOUNT value on done: 14927.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:21,039][63769] Sum rewards: -0.463, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.434', 'AMMO2': '0.013', 'AMMO5': '0.014', 'AMMO4': '0.065', 'weapon7': '0.084', 'AMMO3': '0.098', 'HITCOUNT': '0.160', 'weapon5': '0.168', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'AMMO6': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.250', 'weapon4': '0.354', 'ARMOR': '0.486', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.702', 'weapon2': '1.114', 'weapon3': '1.412', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:21,381][63769] DAMAGECOUNT value on done: 10756.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:21,382][63769] Sum rewards: 0.802, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.092', 'AMMO5': '0.007', 'AMMO2': '0.016', 'AMMO4': '0.078', 'WEAPON5': '0.100', 'weapon5': '0.104', 'AMMO3': '0.113', 'WEAPON4': '0.150', 'HITCOUNT': '0.210', 'weapon4': '0.228', 'ARMOR': '0.538', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.074', 'weapon2': '1.566', 'weapon3': '1.710', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:22,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11264.0, 300 sec: 11260.5). Total num frames: 18014208. Throughput: 0: 801.8, 1: 2003.9. Samples: 4496596. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:22,460][109198] Avg episode reward: [(0, '-0.854'), (1, '-2.532')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:22,724][63735] DAMAGECOUNT value on done: 14148.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:22,724][63735] Sum rewards: -8.759, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-3.508', 'AMMO4': '-0.075', 'AMMO2': '-0.015', 'AMMO5': '0.005', 'weapon5': '0.028', 'ARMOR': '0.036', 'WEAPON5': '0.100', 'AMMO3': '0.178', 'HITCOUNT': '0.260', 'DAMAGECOUNT': '0.810', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.598', 'weapon3': '1.824'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:23,100][63735] DAMAGECOUNT value on done: 10278.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:23,101][63735] Sum rewards: -5.325, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.557', 'weapon4': '0.008', 'AMMO2': '0.012', 'AMMO5': '0.015', 'weapon5': '0.018', 'WEAPON1': '0.050', 'AMMO4': '0.059', 'ARMOR': '0.066', 'AMMO3': '0.120', 'WEAPON4': '0.150', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.762', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.330', 'weapon3': '1.872'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:23,978][63806] DAMAGECOUNT value on done: 12610.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:23,979][63806] Sum rewards: -1.307, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.807', 'AMMO4': '-0.003', 'AMMO2': '-0.001', 'AMMO5': '0.005', 'weapon5': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.084', 'WEAPON5': '0.100', 'AMMO3': '0.129', 'HITCOUNT': '0.270', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.831', 'FRAGCOUNT': '1.000', 'weapon2': '1.414', 'weapon3': '1.686'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:24,355][63806] DAMAGECOUNT value on done: 13118.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:24,356][63806] Sum rewards: 3.509, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.844', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'ARMOR': '0.028', 'weapon5': '0.102', 'AMMO3': '0.139', 'WEAPON5': '0.300', 'HITCOUNT': '0.300', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.191', 'weapon3': '1.526', 'weapon2': '1.888', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:26,027][63733] Updated weights for policy 1, policy_version 2270 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:26,358][63767] DAMAGECOUNT value on done: 14888.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:26,358][63767] Sum rewards: -4.512, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.855', 'weapon5': '0.002', 'AMMO2': '0.007', 'WEAPON1': '0.020', 'AMMO5': '0.020', 'AMMO4': '0.036', 'ARMOR': '0.060', 'AMMO3': '0.182', 'weapon4': '0.196', 'WEAPON4': '0.250', 'HITCOUNT': '0.280', 'WEAPON5': '0.300', 'WEAPON3': '1.050', 'DAMAGECOUNT': '1.110', 'weapon3': '1.610', 'weapon2': '1.720', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:26,769][63767] DAMAGECOUNT value on done: 14404.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:26,769][63767] Sum rewards: -0.241, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.870', 'AMMO5': '0.012', 'AMMO2': '0.022', 'ARMOR': '0.028', 'WEAPON1': '0.030', 'weapon4': '0.030', 'WEAPON4': '0.100', 'AMMO3': '0.103', 'AMMO4': '0.108', 'WEAPON5': '0.200', 'HITCOUNT': '0.260', 'weapon5': '0.352', 'WEAPON3': '0.550', 'weapon3': '1.262', 'DAMAGECOUNT': '1.425', 'weapon2': '1.646', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:27,116][63735] DAMAGECOUNT value on done: 11868.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:27,116][63735] Sum rewards: -1.839, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.810', 'AMMO2': '0.009', 'AMMO5': '0.014', 'WEAPON1': '0.030', 'AMMO4': '0.043', 'weapon5': '0.092', 'WEAPON4': '0.100', 'AMMO3': '0.108', 'ARMOR': '0.108', 'weapon4': '0.156', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.705', 'FRAGCOUNT': '1.000', 'weapon3': '1.340', 'weapon2': '1.756'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:27,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11195.7, 300 sec: 11260.5). Total num frames: 18067456. Throughput: 0: 803.6, 1: 2000.1. Samples: 4513342. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:27,460][109198] Avg episode reward: [(0, '-0.842'), (1, '-2.707')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:27,528][63735] DAMAGECOUNT value on done: 16047.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:27,529][63735] Sum rewards: 0.113, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.444', 'AMMO2': '0.009', 'AMMO5': '0.012', 'AMMO4': '0.046', 'ARMOR': '0.052', 'weapon7': '0.076', 'weapon5': '0.098', 'WEAPON5': '0.100', 'AMMO3': '0.139', 'WEAPON4': '0.150', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON7': '0.200', 'HITCOUNT': '0.230', 'weapon4': '0.286', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.768', 'weapon2': '1.050', 'weapon3': '1.870', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:28,274][63732] Updated weights for policy 0, policy_version 2140 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:29,436][63805] DAMAGECOUNT value on done: 14130.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:29,436][63805] Sum rewards: 1.013, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.820', 'AMMO5': '0.010', 'AMMO2': '0.033', 'weapon4': '0.048', 'WEAPON1': '0.060', 'AMMO3': '0.123', 'WEAPON4': '0.150', 'AMMO4': '0.166', 'WEAPON5': '0.200', 'HITCOUNT': '0.220', 'weapon5': '0.492', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.717', 'weapon2': '1.352', 'weapon3': '1.562', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:29,474][63771] DAMAGECOUNT value on done: 13656.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:29,475][63771] Sum rewards: -0.439, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.086', 'AMMO5': '0.017', 'AMMO2': '0.028', 'weapon7': '0.030', 'weapon4': '0.066', 'WEAPON4': '0.100', 'AMMO3': '0.132', 'AMMO4': '0.141', 'AMMO6': '0.160', 'AMMO7': '0.160', 'weapon5': '0.192', 'WEAPON7': '0.200', 'HITCOUNT': '0.210', 'WEAPON5': '0.250', 'WEAPON3': '0.550', 'DAMAGECOUNT': '1.269', 'weapon2': '1.588', 'weapon3': '1.804', 'FRAGCOUNT': '2.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:29,783][63805] DAMAGECOUNT value on done: 11933.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:29,783][63805] Sum rewards: -1.258, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.216', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'weapon5': '0.048', 'AMMO4': '0.086', 'WEAPON4': '0.100', 'weapon4': '0.120', 'WEAPON5': '0.150', 'AMMO3': '0.156', 'HITCOUNT': '0.300', 'WEAPON3': '0.900', 'weapon2': '1.226', 'DAMAGECOUNT': '1.365', 'weapon3': '2.222', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:29,829][63771] DAMAGECOUNT value on done: 10464.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:29,830][63771] Sum rewards: -3.459, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.162', 'AMMO5': '0.003', 'AMMO2': '0.008', 'WEAPON1': '0.010', 'ARMOR': '0.020', 'AMMO4': '0.038', 'weapon5': '0.040', 'WEAPON5': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.149', 'DAMAGECOUNT': '0.195', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.662', 'weapon3': '1.668'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:31,452][63734] DAMAGECOUNT value on done: 12980.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:31,528][63733] Updated weights for policy 1, policy_version 2280 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:31,823][63734] DAMAGECOUNT value on done: 12959.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:31,823][63734] Sum rewards: -0.768, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.560', 'AMMO5': '0.003', 'AMMO2': '0.007', 'AMMO4': '0.033', 'WEAPON1': '0.040', 'WEAPON5': '0.050', 'AMMO3': '0.141', 'weapon5': '0.142', 'HITCOUNT': '0.360', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.152', 'weapon2': '1.518', 'weapon3': '1.796', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:32,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11332.3, 300 sec: 11260.5). Total num frames: 18124800. Throughput: 0: 813.4, 1: 1988.0. Samples: 4521666. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:32,460][109198] Avg episode reward: [(0, '-0.807'), (1, '-2.810')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:34,831][63770] DAMAGECOUNT value on done: 15027.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:35,182][63770] DAMAGECOUNT value on done: 12050.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:35,182][63770] Sum rewards: -1.785, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.716', 'AMMO5': '0.005', 'ARMOR': '0.012', 'AMMO2': '0.031', 'AMMO3': '0.115', 'weapon5': '0.142', 'AMMO4': '0.155', 'WEAPON5': '0.200', 'HITCOUNT': '0.280', 'WEAPON4': '0.450', 'weapon4': '0.634', 'WEAPON3': '0.650', 'weapon2': '1.020', 'DAMAGECOUNT': '1.059', 'weapon3': '1.428', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:35,432][63767] DAMAGECOUNT value on done: 15358.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:35,433][63767] Sum rewards: -3.272, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.262', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'AMMO2': '0.024', 'ARMOR': '0.060', 'weapon4': '0.086', 'AMMO4': '0.121', 'AMMO3': '0.130', 'HITCOUNT': '0.180', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.501', 'WEAPON3': '0.750', 'weapon5': '0.758', 'weapon3': '1.150', 'weapon2': '1.550', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:35,770][63767] DAMAGECOUNT value on done: 17822.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:35,770][63767] Sum rewards: 1.850, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.236', 'AMMO5': '0.018', 'WEAPON1': '0.030', 'AMMO2': '0.035', 'weapon4': '0.106', 'AMMO3': '0.107', 'AMMO4': '0.173', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'WEAPON5': '0.350', 'weapon5': '0.484', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.690', 'weapon3': '1.108', 'weapon2': '1.966', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:37,022][63733] Updated weights for policy 1, policy_version 2290 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:37,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11264.0, 300 sec: 11260.5). Total num frames: 18182144. Throughput: 0: 841.1, 1: 1969.0. Samples: 4538968. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:37,460][109198] Avg episode reward: [(0, '-0.860'), (1, '-2.695')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:38,387][63732] Updated weights for policy 0, policy_version 2150 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:38,580][63771] DAMAGECOUNT value on done: 11946.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:38,968][63771] DAMAGECOUNT value on done: 14800.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:38,968][63771] Sum rewards: -0.162, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.012', 'AMMO2': '0.016', 'ARMOR': '0.045', 'WEAPON1': '0.060', 'AMMO3': '0.070', 'AMMO4': '0.080', 'HEALTH': '0.084', 'HITCOUNT': '0.100', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.264', 'WEAPON3': '0.350', 'weapon5': '0.476', 'FRAGCOUNT': '1.000', 'weapon3': '1.420', 'weapon2': '1.610'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:40,604][63734] DAMAGECOUNT value on done: 15627.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:40,604][63734] Sum rewards: 0.577, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.029', 'AMMO2': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.050', 'ARMOR': '0.088', 'weapon5': '0.090', 'AMMO3': '0.105', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.218', 'HITCOUNT': '0.230', 'WEAPON3': '0.700', 'weapon2': '0.904', 'DAMAGECOUNT': '0.912', 'weapon3': '1.886', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:40,944][63734] DAMAGECOUNT value on done: 13449.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:40,944][63734] Sum rewards: 1.229, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.132', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'weapon5': '0.016', 'AMMO2': '0.025', 'AMMO4': '0.123', 'AMMO3': '0.134', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'HITCOUNT': '0.450', 'ARMOR': '0.517', 'WEAPON3': '0.700', 'weapon4': '0.738', 'weapon2': '1.072', 'DAMAGECOUNT': '1.452', 'weapon3': '1.614', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:41,160][63805] DAMAGECOUNT value on done: 14976.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:41,328][63770] DAMAGECOUNT value on done: 11802.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:41,329][63770] Sum rewards: 1.330, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.752', 'AMMO2': '0.001', 'AMMO4': '0.006', 'AMMO5': '0.025', 'WEAPON1': '0.060', 'WEAPON4': '0.100', 'AMMO3': '0.109', 'weapon5': '0.168', 'weapon4': '0.206', 'HITCOUNT': '0.350', 'WEAPON5': '0.400', 'WEAPON3': '0.750', 'weapon2': '1.090', 'DAMAGECOUNT': '1.545', 'FRAGCOUNT': '2.000', 'weapon3': '2.022'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:41,500][63805] DAMAGECOUNT value on done: 16060.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:41,500][63805] Sum rewards: -1.635, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.048', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.026', 'weapon5': '0.028', 'ARMOR': '0.096', 'HITCOUNT': '0.110', 'AMMO4': '0.129', 'AMMO3': '0.141', 'WEAPON5': '0.150', 'weapon4': '0.276', 'DAMAGECOUNT': '0.291', 'WEAPON4': '0.300', 'WEAPON3': '0.700', 'weapon3': '1.334', 'weapon2': '1.814', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:41,715][63770] DAMAGECOUNT value on done: 14034.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:41,716][63770] Sum rewards: -5.341, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.576', 'AMMO5': '0.007', 'AMMO2': '0.015', 'AMMO4': '0.073', 'weapon7': '0.094', 'ARMOR': '0.099', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.114', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.150', 'weapon5': '0.182', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.429', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.516', 'weapon3': '1.716'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:42,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11332.3, 300 sec: 11260.5). Total num frames: 18239488. Throughput: 0: 876.9, 1: 1938.1. Samples: 4556028. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:42,460][109198] Avg episode reward: [(0, '-0.841'), (1, '-2.562')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:42,511][63769] DAMAGECOUNT value on done: 14059.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:42,511][63769] Sum rewards: -2.140, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.762', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.022', 'AMMO3': '0.060', 'weapon7': '0.060', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon5': '0.108', 'AMMO4': '0.110', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.414', 'DAMAGECOUNT': '0.540', 'FRAGCOUNT': '1.000', 'weapon3': '1.246', 'weapon2': '1.284'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:42,812][63733] Updated weights for policy 1, policy_version 2300 (0.0013)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:42,903][63806] DAMAGECOUNT value on done: 12804.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:42,907][63769] DAMAGECOUNT value on done: 12365.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:42,908][63769] Sum rewards: 0.406, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO5': '0.007', 'AMMO2': '0.017', 'WEAPON1': '0.030', 'AMMO4': '0.085', 'AMMO3': '0.090', 'WEAPON5': '0.150', 'HITCOUNT': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.570', 'weapon5': '0.620', 'HEALTH': '0.842', 'weapon3': '1.250', 'weapon2': '1.644', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:43,213][63806] DAMAGECOUNT value on done: 13337.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:43,213][63806] Sum rewards: -1.398, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.290', 'AMMO2': '0.014', 'AMMO5': '0.015', 'WEAPON1': '0.070', 'AMMO4': '0.071', 'WEAPON4': '0.100', 'AMMO3': '0.112', 'weapon4': '0.176', 'HITCOUNT': '0.190', 'WEAPON5': '0.300', 'weapon5': '0.362', 'DAMAGECOUNT': '0.690', 'WEAPON3': '0.700', 'weapon2': '1.422', 'weapon3': '1.670', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:43,485][63769] DAMAGECOUNT value on done: 15277.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:43,485][63769] Sum rewards: -0.971, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.860', 'AMMO5': '0.010', 'AMMO2': '0.022', 'WEAPON1': '0.030', 'weapon5': '0.056', 'weapon7': '0.068', 'ARMOR': '0.080', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.109', 'AMMO3': '0.136', 'HITCOUNT': '0.240', 'WEAPON4': '0.250', 'weapon4': '0.268', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.050', 'weapon3': '1.376', 'weapon2': '1.394', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:43,814][63769] DAMAGECOUNT value on done: 11053.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:43,815][63769] Sum rewards: -2.982, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.400', 'AMMO5': '0.007', 'AMMO2': '0.021', 'WEAPON1': '0.030', 'ARMOR': '0.032', 'weapon5': '0.038', 'AMMO4': '0.107', 'AMMO3': '0.146', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'HITCOUNT': '0.210', 'weapon4': '0.334', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.891', 'weapon2': '1.580', 'weapon3': '1.622'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:45,928][63735] DAMAGECOUNT value on done: 14389.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:45,929][63735] Sum rewards: -2.712, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.347', 'AMMO4': '-0.060', 'AMMO2': '-0.012', 'ARMOR': '0.008', 'AMMO5': '0.010', 'WEAPON1': '0.050', 'AMMO3': '0.079', 'HITCOUNT': '0.160', 'WEAPON5': '0.250', 'weapon5': '0.272', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.723', 'FRAGCOUNT': '1.000', 'weapon3': '1.418', 'weapon2': '1.636'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:46,292][63735] DAMAGECOUNT value on done: 10613.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:46,293][63735] Sum rewards: -0.941, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.674', 'AMMO5': '0.005', 'weapon5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.012', 'weapon4': '0.024', 'WEAPON5': '0.050', 'AMMO4': '0.059', 'AMMO3': '0.146', 'WEAPON4': '0.150', 'HITCOUNT': '0.270', 'ARMOR': '0.532', 'WEAPON3': '0.900', 'weapon2': '0.926', 'DAMAGECOUNT': '1.005', 'FRAGCOUNT': '2.000', 'weapon3': '2.634'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:47,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11332.3, 300 sec: 11274.4). Total num frames: 18296832. Throughput: 0: 895.0, 1: 1922.8. Samples: 4564577. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:47,460][109198] Avg episode reward: [(0, '-0.891'), (1, '-2.533')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:47,920][63732] Updated weights for policy 0, policy_version 2160 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:48,502][63806] DAMAGECOUNT value on done: 12730.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:48,604][63767] DAMAGECOUNT value on done: 15307.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:48,604][63767] Sum rewards: 1.038, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.736', 'AMMO5': '0.015', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'AMMO4': '0.091', 'weapon7': '0.098', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.128', 'weapon5': '0.174', 'weapon4': '0.194', 'HITCOUNT': '0.200', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'WEAPON5': '0.300', 'WEAPON3': '0.650', 'weapon2': '1.116', 'DAMAGECOUNT': '1.257', 'weapon3': '1.598', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:48,656][63733] Updated weights for policy 1, policy_version 2310 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:48,943][63806] DAMAGECOUNT value on done: 13442.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:48,943][63806] Sum rewards: -1.920, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.370', 'weapon4': '0.002', 'AMMO5': '0.016', 'AMMO2': '0.021', 'WEAPON1': '0.040', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'AMMO4': '0.103', 'HITCOUNT': '0.170', 'AMMO3': '0.181', 'weapon5': '0.206', 'WEAPON5': '0.350', 'weapon2': '0.790', 'WEAPON3': '0.950', 'DAMAGECOUNT': '0.972', 'FRAGCOUNT': '2.000', 'weapon3': '2.308'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:48,983][63767] DAMAGECOUNT value on done: 14839.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:48,984][63767] Sum rewards: -1.442, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.958', 'AMMO5': '0.005', 'AMMO2': '0.014', 'weapon5': '0.020', 'ARMOR': '0.036', 'weapon7': '0.062', 'AMMO4': '0.069', 'WEAPON5': '0.100', 'AMMO3': '0.113', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.150', 'weapon4': '0.160', 'WEAPON7': '0.200', 'HITCOUNT': '0.250', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.305', 'weapon2': '1.510', 'weapon3': '1.682', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:51,428][63735] DAMAGECOUNT value on done: 11978.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:51,905][63735] DAMAGECOUNT value on done: 16262.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:51,906][63735] Sum rewards: -4.967, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.383', 'AMMO5': '0.013', 'AMMO2': '0.029', 'WEAPON1': '0.030', 'ARMOR': '0.044', 'weapon5': '0.072', 'AMMO4': '0.144', 'AMMO3': '0.176', 'HITCOUNT': '0.210', 'WEAPON5': '0.250', 'weapon4': '0.262', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.645', 'WEAPON3': '1.100', 'weapon2': '1.456', 'weapon3': '1.686', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:52,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11264.0, 300 sec: 11260.5). Total num frames: 18350080. Throughput: 0: 928.1, 1: 1887.1. Samples: 4581383. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:52,460][109198] Avg episode reward: [(0, '-0.859'), (1, '-2.615')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:52,490][63805] DAMAGECOUNT value on done: 14330.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:52,491][63805] Sum rewards: 0.288, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.468', 'AMMO4': '-0.006', 'AMMO2': '-0.001', 'AMMO5': '0.013', 'WEAPON1': '0.030', 'ARMOR': '0.070', 'AMMO3': '0.101', 'HITCOUNT': '0.140', 'WEAPON5': '0.250', 'weapon5': '0.512', 'DAMAGECOUNT': '0.600', 'WEAPON3': '0.650', 'weapon3': '1.292', 'weapon2': '1.606', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:52,883][63805] DAMAGECOUNT value on done: 12312.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:52,883][63805] Sum rewards: -2.499, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.606', 'AMMO5': '0.015', 'AMMO2': '0.017', 'weapon5': '0.040', 'WEAPON1': '0.050', 'ARMOR': '0.077', 'AMMO4': '0.084', 'WEAPON4': '0.100', 'AMMO3': '0.129', 'weapon4': '0.142', 'WEAPON5': '0.250', 'HITCOUNT': '0.330', 'WEAPON3': '0.900', 'weapon2': '1.034', 'DAMAGECOUNT': '1.137', 'FRAGCOUNT': '2.000', 'weapon3': '2.302'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:54,416][63771] DAMAGECOUNT value on done: 13933.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:54,417][63771] Sum rewards: -3.809, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.435', 'WEAPON1': '0.010', 'weapon5': '0.014', 'AMMO5': '0.018', 'AMMO2': '0.029', 'ARMOR': '0.116', 'AMMO4': '0.142', 'AMMO3': '0.161', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'WEAPON5': '0.350', 'weapon4': '0.414', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.831', 'weapon2': '1.104', 'weapon3': '1.818', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:54,488][63733] Updated weights for policy 1, policy_version 2320 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:54,845][63771] DAMAGECOUNT value on done: 10804.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:54,845][63771] Sum rewards: 2.787, reward structure: {'DEATHCOUNT': '-4.500', 'ARMOR': '0.004', 'AMMO5': '0.005', 'AMMO2': '0.007', 'weapon5': '0.022', 'AMMO4': '0.032', 'WEAPON1': '0.050', 'AMMO3': '0.057', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'weapon7': '0.134', 'HITCOUNT': '0.230', 'WEAPON3': '0.300', 'HEALTH': '0.426', 'weapon3': '0.928', 'DAMAGECOUNT': '1.020', 'weapon2': '1.672', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:55,271][63734] DAMAGECOUNT value on done: 13214.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:55,271][63734] Sum rewards: -2.472, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.582', 'AMMO2': '0.000', 'AMMO4': '0.001', 'AMMO5': '0.024', 'WEAPON1': '0.080', 'AMMO3': '0.121', 'HITCOUNT': '0.150', 'weapon5': '0.384', 'WEAPON5': '0.500', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.702', 'weapon2': '1.334', 'weapon3': '1.914'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:55,655][63734] DAMAGECOUNT value on done: 12999.0\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:57,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11264.0, 300 sec: 11260.5). Total num frames: 18407424. Throughput: 0: 966.2, 1: 1859.4. Samples: 4598297. Policy #0 lag: (min: 0.0, avg: 0.3, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:03:57,460][109198] Avg episode reward: [(0, '-0.885'), (1, '-2.596')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:57,570][63732] Updated weights for policy 0, policy_version 2170 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:59,806][63770] DAMAGECOUNT value on done: 15287.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:59,806][63770] Sum rewards: 1.020, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.902', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'AMMO5': '0.005', 'WEAPON1': '0.060', 'AMMO3': '0.074', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.132', 'HITCOUNT': '0.190', 'ARMOR': '0.468', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.780', 'FRAGCOUNT': '1.000', 'weapon2': '1.326', 'weapon3': '1.688'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:59,984][63767] DAMAGECOUNT value on done: 15609.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:03:59,984][63767] Sum rewards: -0.408, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.997', 'AMMO2': '0.009', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.047', 'WEAPON4': '0.050', 'weapon7': '0.076', 'ARMOR': '0.080', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.135', 'weapon4': '0.162', 'weapon5': '0.216', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.753', 'WEAPON3': '0.800', 'weapon2': '1.170', 'weapon3': '1.746', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:00,144][63770] DAMAGECOUNT value on done: 12360.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:00,144][63770] Sum rewards: -1.718, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.667', 'AMMO5': '0.020', 'WEAPON1': '0.030', 'AMMO2': '0.037', 'ARMOR': '0.060', 'weapon5': '0.080', 'weapon4': '0.116', 'AMMO3': '0.143', 'WEAPON4': '0.150', 'AMMO4': '0.183', 'HITCOUNT': '0.250', 'WEAPON5': '0.350', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.930', 'FRAGCOUNT': '1.500', 'weapon2': '1.564', 'weapon3': '1.786'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:00,293][63733] Updated weights for policy 1, policy_version 2330 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:00,416][63767] DAMAGECOUNT value on done: 18102.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:00,416][63767] Sum rewards: 1.626, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.525', 'AMMO5': '0.033', 'AMMO2': '0.037', 'AMMO3': '0.083', 'WEAPON1': '0.090', 'HITCOUNT': '0.170', 'AMMO4': '0.182', 'ARMOR': '0.458', 'WEAPON5': '0.600', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.840', 'weapon2': '0.946', 'weapon5': '1.112', 'weapon3': '1.650', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:02,342][63771] DAMAGECOUNT value on done: 12496.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:02,342][63771] Sum rewards: 2.868, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.523', 'weapon4': '0.006', 'AMMO5': '0.015', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'AMMO4': '0.089', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'WEAPON7': '0.100', 'weapon7': '0.104', 'ARMOR': '0.108', 'AMMO3': '0.109', 'weapon5': '0.116', 'WEAPON5': '0.250', 'HITCOUNT': '0.420', 'WEAPON3': '0.700', 'weapon2': '1.454', 'DAMAGECOUNT': '1.650', 'weapon3': '1.932', 'FRAGCOUNT': '3.500'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:02,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11264.0, 300 sec: 11274.4). Total num frames: 18464768. Throughput: 0: 984.3, 1: 1842.0. Samples: 4606834. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:02,459][109198] Avg episode reward: [(0, '-0.958'), (1, '-2.447')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:02,738][63771] DAMAGECOUNT value on done: 15080.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:02,739][63771] Sum rewards: -0.314, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.472', 'AMMO4': '-0.023', 'AMMO2': '-0.005', 'AMMO5': '0.013', 'WEAPON1': '0.050', 'ARMOR': '0.080', 'AMMO3': '0.119', 'weapon5': '0.166', 'HITCOUNT': '0.180', 'WEAPON5': '0.250', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.840', 'weapon2': '1.508', 'weapon3': '1.680', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:03,361][63734] DAMAGECOUNT value on done: 16037.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:03,362][63734] Sum rewards: -2.596, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.948', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.026', 'weapon5': '0.046', 'ARMOR': '0.064', 'weapon7': '0.082', 'WEAPON5': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO4': '0.130', 'AMMO3': '0.131', 'WEAPON7': '0.200', 'WEAPON4': '0.250', 'HITCOUNT': '0.330', 'weapon4': '0.404', 'WEAPON3': '0.600', 'weapon2': '1.002', 'DAMAGECOUNT': '1.230', 'FRAGCOUNT': '1.500', 'weapon3': '1.752'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:03,701][63734] DAMAGECOUNT value on done: 13897.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:03,701][63734] Sum rewards: -0.237, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.130', 'AMMO2': '0.003', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'ARMOR': '0.012', 'AMMO4': '0.013', 'WEAPON4': '0.050', 'weapon4': '0.050', 'weapon5': '0.072', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.142', 'WEAPON5': '0.250', 'HITCOUNT': '0.350', 'WEAPON3': '0.850', 'weapon2': '1.314', 'DAMAGECOUNT': '1.344', 'weapon3': '1.872', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:04,517][63805] DAMAGECOUNT value on done: 15090.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:04,517][63805] Sum rewards: -2.298, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.478', 'AMMO2': '0.009', 'AMMO5': '0.012', 'WEAPON1': '0.040', 'AMMO4': '0.042', 'ARMOR': '0.056', 'weapon4': '0.104', 'HITCOUNT': '0.120', 'AMMO3': '0.137', 'WEAPON4': '0.150', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.342', 'WEAPON3': '0.800', 'weapon5': '0.934', 'FRAGCOUNT': '1.000', 'weapon3': '1.176', 'weapon2': '1.508'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:04,867][63805] DAMAGECOUNT value on done: 16191.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:04,868][63805] Sum rewards: -0.981, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.071', 'AMMO4': '-0.027', 'AMMO2': '-0.005', 'AMMO5': '0.007', 'WEAPON1': '0.030', 'weapon7': '0.068', 'AMMO3': '0.079', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon5': '0.224', 'DAMAGECOUNT': '0.393', 'ARMOR': '0.507', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.366', 'weapon2': '1.758'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:05,008][63770] DAMAGECOUNT value on done: 12122.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:05,009][63770] Sum rewards: 0.811, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.718', 'AMMO5': '0.010', 'AMMO2': '0.023', 'ARMOR': '0.024', 'WEAPON4': '0.050', 'weapon4': '0.066', 'AMMO3': '0.073', 'WEAPON1': '0.100', 'AMMO4': '0.113', 'HITCOUNT': '0.140', 'weapon5': '0.208', 'WEAPON5': '0.250', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.960', 'weapon3': '1.470', 'weapon2': '1.492', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:05,354][63770] DAMAGECOUNT value on done: 14361.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:05,355][63770] Sum rewards: -1.987, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.651', 'ARMOR': '0.004', 'weapon4': '0.008', 'AMMO5': '0.018', 'AMMO2': '0.022', 'WEAPON1': '0.070', 'WEAPON4': '0.100', 'AMMO4': '0.111', 'AMMO3': '0.134', 'HITCOUNT': '0.220', 'WEAPON5': '0.350', 'weapon5': '0.526', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.981', 'weapon2': '1.126', 'weapon3': '1.944', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:05,993][63769] DAMAGECOUNT value on done: 15742.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:05,994][63769] Sum rewards: -0.540, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.540', 'AMMO2': '0.015', 'AMMO5': '0.019', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'AMMO4': '0.074', 'weapon4': '0.080', 'AMMO3': '0.111', 'HITCOUNT': '0.120', 'weapon5': '0.388', 'WEAPON5': '0.450', 'WEAPON3': '0.600', 'weapon2': '1.208', 'DAMAGECOUNT': '1.395', 'weapon3': '1.688', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:06,093][63733] Updated weights for policy 1, policy_version 2340 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:06,354][63806] DAMAGECOUNT value on done: 13205.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:06,355][63806] Sum rewards: 0.044, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.706', 'weapon4': '0.002', 'AMMO5': '0.007', 'AMMO2': '0.008', 'WEAPON1': '0.010', 'AMMO4': '0.037', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'AMMO3': '0.100', 'WEAPON5': '0.150', 'weapon5': '0.222', 'HITCOUNT': '0.340', 'WEAPON3': '0.550', 'DAMAGECOUNT': '1.203', 'weapon3': '1.324', 'weapon2': '1.956', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:06,363][63769] DAMAGECOUNT value on done: 11287.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:06,364][63769] Sum rewards: -0.096, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.284', 'AMMO4': '-0.049', 'AMMO2': '-0.010', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'weapon7': '0.062', 'ARMOR': '0.068', 'AMMO3': '0.101', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon5': '0.140', 'WEAPON5': '0.150', 'WEAPON7': '0.200', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.702', 'WEAPON3': '0.750', 'weapon2': '1.468', 'weapon3': '1.880', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:06,729][63806] DAMAGECOUNT value on done: 13530.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:06,729][63806] Sum rewards: 1.538, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO2': '0.022', 'AMMO5': '0.022', 'ARMOR': '0.040', 'weapon4': '0.040', 'WEAPON1': '0.060', 'AMMO3': '0.080', 'WEAPON4': '0.100', 'AMMO4': '0.109', 'HITCOUNT': '0.180', 'weapon5': '0.292', 'HEALTH': '0.314', 'WEAPON3': '0.450', 'WEAPON5': '0.450', 'DAMAGECOUNT': '0.579', 'weapon3': '1.452', 'weapon2': '1.848', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:07,081][63732] Updated weights for policy 0, policy_version 2180 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:07,369][63769] DAMAGECOUNT value on done: 14594.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:07,370][63769] Sum rewards: 0.477, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.410', 'AMMO4': '-0.003', 'AMMO2': '-0.001', 'AMMO3': '0.092', 'weapon7': '0.130', 'AMMO6': '0.220', 'AMMO7': '0.220', 'WEAPON7': '0.300', 'HITCOUNT': '0.310', 'ARMOR': '0.416', 'WEAPON3': '0.600', 'weapon3': '1.482', 'weapon2': '1.516', 'DAMAGECOUNT': '1.605', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:07,458][109198] Fps is (10 sec: 11468.9, 60 sec: 11332.3, 300 sec: 11274.4). Total num frames: 18522112. Throughput: 0: 1019.4, 1: 1808.4. Samples: 4623850. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:07,459][109198] Avg episode reward: [(0, '-1.005'), (1, '-2.330')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:07,718][63769] DAMAGECOUNT value on done: 12758.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:07,719][63769] Sum rewards: -2.666, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.596', 'AMMO2': '0.019', 'AMMO5': '0.027', 'ARMOR': '0.028', 'WEAPON1': '0.070', 'AMMO4': '0.094', 'WEAPON4': '0.100', 'weapon4': '0.112', 'AMMO3': '0.172', 'weapon5': '0.226', 'HITCOUNT': '0.340', 'WEAPON5': '0.400', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.179', 'weapon2': '1.618', 'weapon3': '1.646', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:09,229][63735] DAMAGECOUNT value on done: 14544.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:09,230][63735] Sum rewards: -0.686, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.319', 'AMMO5': '0.005', 'AMMO2': '0.014', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'AMMO4': '0.070', 'AMMO3': '0.082', 'WEAPON5': '0.100', 'HITCOUNT': '0.130', 'weapon5': '0.184', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.500', 'ARMOR': '0.552', 'FRAGCOUNT': '1.000', 'weapon2': '1.182', 'weapon3': '1.278'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:09,597][63735] DAMAGECOUNT value on done: 11075.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:09,597][63735] Sum rewards: 1.311, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.514', 'AMMO5': '0.010', 'AMMO2': '0.014', 'weapon4': '0.044', 'WEAPON1': '0.060', 'AMMO4': '0.069', 'ARMOR': '0.076', 'AMMO3': '0.130', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'weapon5': '0.200', 'HITCOUNT': '0.310', 'WEAPON3': '0.700', 'weapon2': '1.216', 'DAMAGECOUNT': '1.386', 'weapon3': '1.760', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:11,165][63767] DAMAGECOUNT value on done: 15496.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:11,166][63767] Sum rewards: -0.082, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.453', 'AMMO4': '-0.010', 'AMMO2': '-0.002', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO3': '0.074', 'weapon5': '0.104', 'HITCOUNT': '0.150', 'WEAPON5': '0.200', 'ARMOR': '0.532', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.567', 'weapon3': '1.414', 'weapon2': '1.514', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:11,552][63767] DAMAGECOUNT value on done: 15318.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:11,553][63767] Sum rewards: -1.420, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.508', 'AMMO2': '0.004', 'AMMO5': '0.012', 'AMMO4': '0.022', 'ARMOR': '0.040', 'AMMO3': '0.162', 'weapon5': '0.168', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.300', 'HITCOUNT': '0.310', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.437', 'weapon2': '1.508', 'weapon3': '1.924'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:11,949][63733] Updated weights for policy 1, policy_version 2350 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:12,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11264.0, 300 sec: 11260.5). Total num frames: 18575360. Throughput: 0: 1049.3, 1: 1780.7. Samples: 4640691. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:12,460][109198] Avg episode reward: [(0, '-0.977'), (1, '-2.322')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:12,919][63806] DAMAGECOUNT value on done: 12969.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:13,358][63806] DAMAGECOUNT value on done: 13887.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:13,358][63806] Sum rewards: -0.571, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.423', 'weapon5': '0.006', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.025', 'ARMOR': '0.088', 'AMMO4': '0.125', 'AMMO3': '0.128', 'WEAPON5': '0.150', 'weapon4': '0.222', 'WEAPON4': '0.300', 'HITCOUNT': '0.430', 'WEAPON3': '0.750', 'weapon2': '0.896', 'DAMAGECOUNT': '1.335', 'weapon3': '2.126', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:15,787][63805] DAMAGECOUNT value on done: 14479.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:15,788][63805] Sum rewards: -1.814, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.970', 'AMMO2': '0.007', 'AMMO5': '0.015', 'AMMO4': '0.035', 'ARMOR': '0.040', 'WEAPON1': '0.050', 'HITCOUNT': '0.140', 'AMMO3': '0.147', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.447', 'WEAPON3': '0.700', 'weapon5': '0.804', 'FRAGCOUNT': '1.000', 'weapon3': '1.340', 'weapon2': '1.630'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:16,154][63735] DAMAGECOUNT value on done: 12158.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:16,154][63735] Sum rewards: -3.204, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.636', 'AMMO2': '0.015', 'AMMO5': '0.018', 'ARMOR': '0.044', 'WEAPON1': '0.050', 'AMMO4': '0.073', 'AMMO3': '0.128', 'WEAPON4': '0.150', 'weapon4': '0.162', 'HITCOUNT': '0.170', 'weapon5': '0.268', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.540', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.374', 'weapon3': '1.490'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:16,180][63805] DAMAGECOUNT value on done: 12645.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:16,181][63805] Sum rewards: 1.103, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.782', 'AMMO2': '0.013', 'AMMO5': '0.018', 'ARMOR': '0.040', 'WEAPON1': '0.040', 'AMMO4': '0.063', 'AMMO3': '0.124', 'WEAPON4': '0.150', 'weapon4': '0.164', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'weapon5': '0.416', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.999', 'weapon3': '1.268', 'weapon2': '1.820', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:16,475][63735] DAMAGECOUNT value on done: 16613.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:16,475][63735] Sum rewards: 0.238, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.480', 'AMMO5': '0.003', 'AMMO2': '0.003', 'weapon5': '0.014', 'AMMO4': '0.016', 'WEAPON4': '0.050', 'WEAPON5': '0.050', 'ARMOR': '0.080', 'weapon4': '0.118', 'AMMO3': '0.123', 'HITCOUNT': '0.250', 'WEAPON3': '0.500', 'DAMAGECOUNT': '1.053', 'weapon2': '1.372', 'weapon3': '1.586', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:16,826][63732] Updated weights for policy 0, policy_version 2190 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:17,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11264.0, 300 sec: 11260.5). Total num frames: 18632704. Throughput: 0: 1055.4, 1: 1774.1. Samples: 4648994. Policy #0 lag: (min: 0.0, avg: 0.3, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:17,460][109198] Avg episode reward: [(0, '-0.947'), (1, '-2.259')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:17,851][63733] Updated weights for policy 1, policy_version 2360 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:19,257][63734] DAMAGECOUNT value on done: 13454.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:19,258][63734] Sum rewards: -3.160, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.588', 'AMMO2': '0.008', 'AMMO5': '0.023', 'AMMO4': '0.038', 'ARMOR': '0.040', 'weapon5': '0.068', 'WEAPON1': '0.070', 'AMMO3': '0.158', 'HITCOUNT': '0.190', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.720', 'WEAPON3': '0.950', 'weapon2': '1.606', 'weapon3': '1.958', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:19,658][63734] DAMAGECOUNT value on done: 13169.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:19,659][63734] Sum rewards: -6.870, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.755', 'AMMO2': '0.012', 'AMMO5': '0.025', 'ARMOR': '0.036', 'WEAPON1': '0.040', 'AMMO4': '0.061', 'AMMO3': '0.115', 'weapon4': '0.116', 'weapon5': '0.136', 'HITCOUNT': '0.190', 'WEAPON4': '0.200', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.612', 'weapon2': '1.782'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:19,681][63771] DAMAGECOUNT value on done: 14355.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:19,681][63771] Sum rewards: -2.159, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.631', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'AMMO5': '0.010', 'ARMOR': '0.068', 'weapon5': '0.128', 'AMMO3': '0.164', 'WEAPON5': '0.200', 'HITCOUNT': '0.280', 'WEAPON3': '1.100', 'weapon2': '1.204', 'DAMAGECOUNT': '1.266', 'FRAGCOUNT': '2.000', 'weapon3': '2.332'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:20,073][63771] DAMAGECOUNT value on done: 11094.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:20,074][63771] Sum rewards: -5.165, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.074', 'AMMO5': '0.018', 'AMMO2': '0.019', 'ARMOR': '0.044', 'WEAPON4': '0.050', 'WEAPON1': '0.070', 'AMMO4': '0.096', 'weapon5': '0.104', 'AMMO3': '0.132', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.870', 'weapon2': '1.390', 'FRAGCOUNT': '2.000', 'weapon3': '2.046'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:22,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11195.7, 300 sec: 11246.6). Total num frames: 18685952. Throughput: 0: 1062.2, 1: 1751.8. Samples: 4665600. Policy #0 lag: (min: 0.0, avg: 0.1, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:22,460][109198] Avg episode reward: [(0, '-0.923'), (1, '-2.323')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:23,795][63733] Updated weights for policy 1, policy_version 2370 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:25,109][63767] DAMAGECOUNT value on done: 15731.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:25,109][63767] Sum rewards: -4.570, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.015', 'ARMOR': '0.028', 'AMMO2': '0.033', 'WEAPON1': '0.050', 'WEAPON4': '0.100', 'AMMO3': '0.106', 'HITCOUNT': '0.130', 'HEALTH': '0.140', 'AMMO4': '0.166', 'weapon5': '0.170', 'WEAPON5': '0.250', 'weapon4': '0.336', 'DAMAGECOUNT': '0.366', 'WEAPON3': '0.500', 'weapon2': '1.032', 'weapon3': '1.758'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:25,229][63770] DAMAGECOUNT value on done: 15584.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:25,230][63770] Sum rewards: 0.533, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.602', 'AMMO5': '0.020', 'AMMO2': '0.023', 'weapon4': '0.070', 'AMMO3': '0.084', 'WEAPON1': '0.110', 'AMMO4': '0.116', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'weapon5': '0.236', 'WEAPON5': '0.450', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.891', 'weapon2': '1.214', 'weapon3': '1.570', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:25,520][63767] DAMAGECOUNT value on done: 18207.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:25,667][63770] DAMAGECOUNT value on done: 12825.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:25,668][63770] Sum rewards: 1.169, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.185', 'AMMO2': '0.010', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.048', 'ARMOR': '0.052', 'weapon7': '0.062', 'weapon5': '0.082', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.133', 'WEAPON5': '0.200', 'HITCOUNT': '0.320', 'WEAPON3': '0.800', 'weapon2': '1.380', 'DAMAGECOUNT': '1.395', 'weapon3': '1.790', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:26,341][63734] DAMAGECOUNT value on done: 16323.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:26,341][63734] Sum rewards: -4.945, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.580', 'AMMO2': '0.002', 'AMMO4': '0.012', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'ARMOR': '0.028', 'AMMO3': '0.189', 'HITCOUNT': '0.190', 'weapon5': '0.192', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.858', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.192', 'weapon3': '1.934'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:26,433][63771] DAMAGECOUNT value on done: 12561.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:26,434][63771] Sum rewards: -2.188, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.244', 'AMMO5': '0.007', 'AMMO2': '0.018', 'WEAPON1': '0.050', 'HITCOUNT': '0.060', 'ARMOR': '0.080', 'AMMO4': '0.091', 'AMMO3': '0.100', 'weapon4': '0.132', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.195', 'WEAPON5': '0.200', 'weapon5': '0.214', 'WEAPON3': '0.550', 'weapon3': '0.940', 'FRAGCOUNT': '1.000', 'weapon2': '1.768'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:26,481][63732] Updated weights for policy 0, policy_version 2200 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:26,722][63734] DAMAGECOUNT value on done: 14090.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:26,723][63734] Sum rewards: -2.174, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.515', 'AMMO2': '0.002', 'AMMO4': '0.010', 'AMMO5': '0.023', 'WEAPON1': '0.040', 'weapon5': '0.068', 'AMMO3': '0.091', 'weapon4': '0.092', 'WEAPON4': '0.100', 'ARMOR': '0.128', 'HITCOUNT': '0.190', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.579', 'WEAPON3': '0.700', 'weapon3': '1.556', 'weapon2': '1.612', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:26,838][63771] DAMAGECOUNT value on done: 15510.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:26,838][63771] Sum rewards: 0.402, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.149', 'AMMO4': '-0.002', 'AMMO2': '-0.000', 'WEAPON1': '0.010', 'AMMO5': '0.010', 'weapon4': '0.028', 'WEAPON4': '0.050', 'ARMOR': '0.064', 'AMMO3': '0.117', 'WEAPON5': '0.200', 'HITCOUNT': '0.300', 'weapon5': '0.392', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.290', 'weapon2': '1.600', 'weapon3': '1.742', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:27,458][109198] Fps is (10 sec: 11468.7, 60 sec: 11332.3, 300 sec: 11246.6). Total num frames: 18747392. Throughput: 0: 1063.2, 1: 1750.6. Samples: 4682645. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:27,460][109198] Avg episode reward: [(0, '-1.049'), (1, '-2.069')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:27,467][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002201_9015296.pth...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:27,467][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000002376_9732096.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:27,518][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001995_8171520.pth\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:27,528][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001924_7880704.pth\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:27,535][63576] Saving new best policy, reward=-2.069!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:27,720][63805] DAMAGECOUNT value on done: 15265.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:27,721][63805] Sum rewards: -0.284, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.897', 'AMMO5': '0.010', 'AMMO2': '0.012', 'weapon5': '0.032', 'WEAPON1': '0.040', 'AMMO4': '0.057', 'AMMO3': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.150', 'HITCOUNT': '0.170', 'weapon4': '0.264', 'DAMAGECOUNT': '0.525', 'ARMOR': '0.545', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon2': '1.514', 'weapon3': '1.544'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:28,136][63805] DAMAGECOUNT value on done: 16411.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:28,136][63805] Sum rewards: -1.987, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.850', 'AMMO4': '-0.034', 'AMMO2': '-0.007', 'AMMO5': '0.012', 'WEAPON1': '0.060', 'ARMOR': '0.069', 'AMMO3': '0.086', 'HITCOUNT': '0.180', 'WEAPON5': '0.300', 'weapon5': '0.542', 'DAMAGECOUNT': '0.660', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.312', 'weapon3': '1.682'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:28,703][63769] DAMAGECOUNT value on done: 16272.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:28,704][63769] Sum rewards: -1.062, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.628', 'WEAPON1': '0.010', 'AMMO2': '0.015', 'AMMO5': '0.025', 'weapon4': '0.056', 'AMMO4': '0.075', 'WEAPON4': '0.100', 'AMMO3': '0.164', 'weapon5': '0.216', 'WEAPON5': '0.350', 'HITCOUNT': '0.380', 'WEAPON3': '0.900', 'weapon3': '1.502', 'DAMAGECOUNT': '1.590', 'weapon2': '1.682', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:29,030][63769] DAMAGECOUNT value on done: 11504.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:29,031][63769] Sum rewards: -7.361, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.642', 'AMMO5': '0.003', 'weapon5': '0.008', 'WEAPON1': '0.010', 'AMMO2': '0.015', 'WEAPON5': '0.050', 'weapon4': '0.070', 'AMMO4': '0.074', 'ARMOR': '0.096', 'WEAPON4': '0.150', 'HITCOUNT': '0.180', 'AMMO3': '0.193', 'DAMAGECOUNT': '0.651', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050', 'weapon2': '1.130', 'weapon3': '2.352'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:29,247][63770] DAMAGECOUNT value on done: 13057.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:29,248][63770] Sum rewards: 1.445, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.726', 'AMMO2': '0.001', 'AMMO4': '0.005', 'weapon5': '0.012', 'AMMO5': '0.023', 'WEAPON1': '0.040', 'ARMOR': '0.052', 'weapon7': '0.076', 'AMMO3': '0.079', 'weapon4': '0.142', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.240', 'WEAPON5': '0.350', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.305', 'weapon3': '1.584', 'weapon2': '1.692', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:29,564][63733] Updated weights for policy 1, policy_version 2380 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:29,632][63770] DAMAGECOUNT value on done: 14491.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:29,696][63806] DAMAGECOUNT value on done: 13467.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:30,020][63806] DAMAGECOUNT value on done: 13768.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:30,021][63806] Sum rewards: 2.124, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.768', 'AMMO2': '0.003', 'AMMO5': '0.010', 'AMMO4': '0.013', 'weapon5': '0.018', 'WEAPON1': '0.050', 'WEAPON4': '0.050', 'AMMO3': '0.098', 'weapon4': '0.124', 'ARMOR': '0.140', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.714', 'weapon3': '1.494', 'weapon2': '1.818', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:32,458][109198] Fps is (10 sec: 11468.8, 60 sec: 11264.0, 300 sec: 11232.8). Total num frames: 18800640. Throughput: 0: 1059.6, 1: 1749.3. Samples: 4690975. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:32,460][109198] Avg episode reward: [(0, '-1.175'), (1, '-1.868')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:32,462][63576] Saving new best policy, reward=-1.868!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:32,469][63769] DAMAGECOUNT value on done: 14821.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:32,469][63769] Sum rewards: 2.910, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.094', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.012', 'ARMOR': '0.015', 'WEAPON5': '0.050', 'AMMO4': '0.058', 'AMMO3': '0.090', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon7': '0.112', 'weapon5': '0.138', 'WEAPON4': '0.150', 'HITCOUNT': '0.200', 'weapon4': '0.362', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.681', 'weapon2': '1.022', 'weapon3': '1.552', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:32,714][63735] DAMAGECOUNT value on done: 14809.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:32,715][63735] Sum rewards: 1.488, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.455', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'AMMO5': '0.020', 'ARMOR': '0.028', 'WEAPON1': '0.040', 'AMMO3': '0.050', 'WEAPON4': '0.050', 'weapon5': '0.080', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon7': '0.126', 'weapon4': '0.138', 'HITCOUNT': '0.210', 'WEAPON5': '0.300', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.795', 'FRAGCOUNT': '1.000', 'weapon3': '1.142', 'weapon2': '1.774'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:32,865][63769] DAMAGECOUNT value on done: 12773.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:32,866][63769] Sum rewards: 1.685, reward structure: {'DEATHCOUNT': '-1.500', 'HEALTH': '-0.625', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.005', 'HITCOUNT': '0.010', 'WEAPON1': '0.020', 'AMMO3': '0.036', 'DAMAGECOUNT': '0.045', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon5': '0.490', 'ARMOR': '0.500', 'weapon3': '0.610', 'weapon2': '0.790', 'FRAGCOUNT': '1.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:33,104][63735] DAMAGECOUNT value on done: 11270.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:33,105][63735] Sum rewards: -2.911, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.515', 'AMMO2': '0.016', 'AMMO5': '0.023', 'weapon4': '0.042', 'AMMO4': '0.077', 'WEAPON1': '0.090', 'WEAPON4': '0.100', 'AMMO3': '0.111', 'HITCOUNT': '0.130', 'weapon5': '0.350', 'WEAPON5': '0.450', 'DAMAGECOUNT': '0.585', 'WEAPON3': '0.750', 'weapon3': '1.530', 'weapon2': '1.600', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:33,523][63767] DAMAGECOUNT value on done: 15573.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:33,906][63767] DAMAGECOUNT value on done: 15613.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:33,906][63767] Sum rewards: -5.814, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.706', 'weapon5': '0.006', 'AMMO2': '0.006', 'AMMO5': '0.015', 'AMMO4': '0.030', 'ARMOR': '0.032', 'WEAPON4': '0.150', 'weapon4': '0.164', 'HITCOUNT': '0.190', 'AMMO3': '0.246', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.885', 'WEAPON3': '1.100', 'weapon2': '1.542', 'weapon3': '1.976', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:35,190][63733] Updated weights for policy 1, policy_version 2390 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:37,032][63732] Updated weights for policy 0, policy_version 2210 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:37,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11264.0, 300 sec: 11232.8). Total num frames: 18857984. Throughput: 0: 1042.4, 1: 1758.2. Samples: 4707408. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:37,460][109198] Avg episode reward: [(0, '-1.220'), (1, '-1.802')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:37,466][63576] Saving new best policy, reward=-1.802!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:37,689][63806] DAMAGECOUNT value on done: 13149.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:37,689][63806] Sum rewards: -0.350, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.612', 'AMMO5': '0.012', 'AMMO2': '0.027', 'WEAPON1': '0.040', 'AMMO3': '0.048', 'ARMOR': '0.098', 'HITCOUNT': '0.120', 'AMMO4': '0.136', 'weapon4': '0.202', 'WEAPON5': '0.250', 'WEAPON4': '0.250', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.540', 'weapon3': '0.864', 'weapon5': '0.896', 'FRAGCOUNT': '1.000', 'weapon2': '1.478'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:38,038][63806] DAMAGECOUNT value on done: 14037.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:39,036][63805] DAMAGECOUNT value on done: 14692.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:39,037][63805] Sum rewards: -0.648, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.826', 'AMMO5': '0.020', 'ARMOR': '0.024', 'AMMO2': '0.030', 'AMMO3': '0.085', 'WEAPON1': '0.090', 'WEAPON4': '0.100', 'weapon4': '0.102', 'AMMO4': '0.150', 'HITCOUNT': '0.160', 'WEAPON3': '0.350', 'weapon5': '0.386', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.639', 'weapon3': '0.928', 'FRAGCOUNT': '1.000', 'weapon2': '1.714'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:39,424][63805] DAMAGECOUNT value on done: 13085.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:39,425][63805] Sum rewards: -2.130, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.103', 'AMMO2': '0.008', 'weapon5': '0.020', 'AMMO5': '0.022', 'ARMOR': '0.032', 'AMMO4': '0.042', 'WEAPON1': '0.070', 'weapon4': '0.074', 'WEAPON4': '0.100', 'AMMO3': '0.170', 'HITCOUNT': '0.250', 'WEAPON5': '0.450', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.320', 'weapon2': '1.686', 'weapon3': '1.828', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:40,850][63733] Updated weights for policy 1, policy_version 2400 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:40,873][63735] DAMAGECOUNT value on done: 12307.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:40,874][63735] Sum rewards: -5.679, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.716', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.002', 'AMMO4': '0.010', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'ARMOR': '0.035', 'AMMO3': '0.147', 'HITCOUNT': '0.150', 'weapon5': '0.168', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.447', 'WEAPON3': '0.650', 'weapon2': '1.508', 'weapon3': '1.950'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:41,273][63735] DAMAGECOUNT value on done: 16892.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:41,274][63735] Sum rewards: 2.543, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.514', 'AMMO5': '0.007', 'AMMO2': '0.015', 'WEAPON1': '0.040', 'AMMO4': '0.072', 'AMMO3': '0.087', 'weapon4': '0.088', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'weapon5': '0.178', 'HITCOUNT': '0.280', 'ARMOR': '0.570', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.837', 'weapon2': '1.486', 'weapon3': '1.796', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:42,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11195.7, 300 sec: 11232.8). Total num frames: 18911232. Throughput: 0: 1033.0, 1: 1761.8. Samples: 4724063. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:42,460][109198] Avg episode reward: [(0, '-1.343'), (1, '-1.700')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:42,462][63576] Saving new best policy, reward=-1.700!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:43,158][63734] DAMAGECOUNT value on done: 13609.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:43,159][63734] Sum rewards: -0.798, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.128', 'AMMO2': '0.011', 'AMMO5': '0.020', 'WEAPON1': '0.020', 'weapon4': '0.028', 'AMMO4': '0.055', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.102', 'ARMOR': '0.125', 'weapon5': '0.160', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.470', 'weapon2': '1.674'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:43,548][63734] DAMAGECOUNT value on done: 13527.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:43,549][63734] Sum rewards: -1.336, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.766', 'AMMO2': '0.013', 'AMMO5': '0.018', 'weapon4': '0.020', 'ARMOR': '0.040', 'AMMO4': '0.063', 'WEAPON1': '0.090', 'WEAPON4': '0.150', 'AMMO3': '0.159', 'WEAPON5': '0.250', 'HITCOUNT': '0.260', 'weapon5': '0.464', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.074', 'weapon2': '1.178', 'weapon3': '1.802', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:44,977][63771] DAMAGECOUNT value on done: 14470.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:45,361][63771] DAMAGECOUNT value on done: 11274.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:46,760][63733] Updated weights for policy 1, policy_version 2410 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:47,159][63732] Updated weights for policy 0, policy_version 2220 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:47,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11195.7, 300 sec: 11232.8). Total num frames: 18968576. Throughput: 0: 1029.2, 1: 1760.9. Samples: 4732391. Policy #0 lag: (min: 0.0, avg: 0.3, max: 2.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:47,460][109198] Avg episode reward: [(0, '-1.416'), (1, '-1.695')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:47,466][63576] Saving new best policy, reward=-1.695!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:50,013][63767] DAMAGECOUNT value on done: 15914.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:50,014][63767] Sum rewards: -2.821, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.720', 'AMMO5': '0.007', 'AMMO2': '0.012', 'WEAPON1': '0.020', 'weapon5': '0.046', 'WEAPON4': '0.050', 'AMMO4': '0.059', 'HITCOUNT': '0.140', 'weapon4': '0.140', 'AMMO3': '0.177', 'WEAPON5': '0.200', 'ARMOR': '0.472', 'DAMAGECOUNT': '0.549', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.434', 'weapon3': '1.692'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:50,446][63767] DAMAGECOUNT value on done: 18452.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:50,446][63767] Sum rewards: -1.538, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.235', 'AMMO2': '0.009', 'AMMO5': '0.015', 'WEAPON1': '0.030', 'weapon4': '0.034', 'ARMOR': '0.036', 'AMMO4': '0.045', 'WEAPON4': '0.100', 'AMMO3': '0.121', 'HITCOUNT': '0.210', 'weapon5': '0.248', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.735', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.194', 'weapon3': '2.120'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:50,639][63770] DAMAGECOUNT value on done: 16023.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:50,639][63770] Sum rewards: -0.041, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.066', 'AMMO2': '0.010', 'AMMO5': '0.012', 'weapon4': '0.028', 'AMMO4': '0.050', 'WEAPON1': '0.050', 'ARMOR': '0.088', 'WEAPON4': '0.100', 'AMMO3': '0.126', 'weapon5': '0.132', 'WEAPON5': '0.250', 'HITCOUNT': '0.370', 'WEAPON3': '0.850', 'weapon2': '1.262', 'DAMAGECOUNT': '1.317', 'weapon3': '2.130', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:51,048][63770] DAMAGECOUNT value on done: 13060.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:51,049][63770] Sum rewards: -5.206, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.014', 'AMMO5': '0.003', 'AMMO2': '0.008', 'WEAPON1': '0.020', 'AMMO4': '0.042', 'weapon5': '0.074', 'WEAPON5': '0.100', 'weapon4': '0.142', 'HITCOUNT': '0.190', 'WEAPON4': '0.200', 'AMMO3': '0.202', 'ARMOR': '0.412', 'DAMAGECOUNT': '0.705', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050', 'weapon2': '1.186', 'weapon3': '1.974'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:51,273][63805] DAMAGECOUNT value on done: 15507.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:51,273][63805] Sum rewards: 0.183, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '0.005', 'AMMO5': '0.007', 'AMMO2': '0.010', 'weapon4': '0.034', 'WEAPON1': '0.040', 'WEAPON4': '0.050', 'AMMO4': '0.051', 'ARMOR': '0.068', 'AMMO3': '0.099', 'WEAPON5': '0.150', 'HITCOUNT': '0.200', 'weapon5': '0.222', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.726', 'FRAGCOUNT': '1.000', 'weapon2': '1.112', 'weapon3': '1.858'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:51,665][63805] DAMAGECOUNT value on done: 16706.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:51,666][63805] Sum rewards: -3.628, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.760', 'AMMO4': '-0.008', 'AMMO2': '-0.002', 'AMMO5': '0.013', 'weapon4': '0.048', 'WEAPON1': '0.070', 'WEAPON4': '0.100', 'AMMO3': '0.134', 'weapon5': '0.196', 'WEAPON5': '0.250', 'HITCOUNT': '0.270', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.885', 'weapon2': '1.100', 'FRAGCOUNT': '2.000', 'weapon3': '2.226'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:51,716][63734] DAMAGECOUNT value on done: 16598.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:51,717][63734] Sum rewards: -4.082, reward structure: {'DEATHCOUNT': '-10.500', 'AMMO2': '0.006', 'AMMO5': '0.007', 'ARMOR': '0.024', 'AMMO4': '0.028', 'HEALTH': '0.031', 'WEAPON4': '0.050', 'AMMO3': '0.126', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'weapon5': '0.294', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.825', 'weapon2': '1.020', 'weapon3': '2.386'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:51,938][63771] DAMAGECOUNT value on done: 12940.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:51,939][63771] Sum rewards: -0.301, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.349', 'AMMO2': '0.010', 'AMMO5': '0.032', 'AMMO4': '0.050', 'WEAPON1': '0.050', 'AMMO3': '0.171', 'weapon5': '0.244', 'HITCOUNT': '0.360', 'ARMOR': '0.492', 'WEAPON5': '0.500', 'weapon2': '0.816', 'WEAPON3': '1.100', 'DAMAGECOUNT': '1.137', 'weapon3': '2.336', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:52,075][63734] DAMAGECOUNT value on done: 14420.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:52,076][63734] Sum rewards: -0.055, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.195', 'AMMO2': '0.011', 'ARMOR': '0.016', 'AMMO5': '0.022', 'AMMO4': '0.057', 'WEAPON1': '0.080', 'WEAPON4': '0.100', 'weapon4': '0.132', 'AMMO3': '0.153', 'weapon5': '0.166', 'HITCOUNT': '0.270', 'WEAPON5': '0.450', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.990', 'weapon2': '1.452', 'weapon3': '1.690', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:52,336][63771] DAMAGECOUNT value on done: 15805.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:52,336][63771] Sum rewards: -6.620, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.108', 'AMMO2': '0.007', 'AMMO5': '0.007', 'weapon5': '0.026', 'AMMO4': '0.036', 'WEAPON1': '0.060', 'ARMOR': '0.104', 'WEAPON5': '0.150', 'AMMO3': '0.166', 'weapon4': '0.188', 'HITCOUNT': '0.230', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.885', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon3': '1.616', 'weapon2': '1.812'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:52,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11195.7, 300 sec: 11218.9). Total num frames: 19021824. Throughput: 0: 1020.3, 1: 1752.6. Samples: 4748632. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:52,460][109198] Avg episode reward: [(0, '-1.547'), (1, '-1.704')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:52,802][63733] Updated weights for policy 1, policy_version 2420 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:53,093][63806] DAMAGECOUNT value on done: 13635.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:53,093][63806] Sum rewards: -3.274, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.980', 'weapon5': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.011', 'WEAPON1': '0.030', 'AMMO4': '0.053', 'ARMOR': '0.125', 'AMMO3': '0.131', 'weapon4': '0.146', 'WEAPON4': '0.150', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.504', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.698', 'weapon2': '1.730'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:53,358][63770] DAMAGECOUNT value on done: 13376.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:53,359][63770] Sum rewards: 1.305, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.475', 'AMMO2': '0.008', 'AMMO5': '0.015', 'AMMO4': '0.040', 'WEAPON1': '0.070', 'AMMO3': '0.091', 'HITCOUNT': '0.180', 'WEAPON5': '0.350', 'WEAPON3': '0.650', 'weapon5': '0.920', 'DAMAGECOUNT': '0.957', 'weapon3': '1.282', 'weapon2': '1.466', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:53,471][63806] DAMAGECOUNT value on done: 14238.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:53,471][63806] Sum rewards: 5.599, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.624', 'AMMO4': '-0.008', 'AMMO2': '-0.002', 'weapon4': '0.022', 'WEAPON1': '0.040', 'WEAPON4': '0.050', 'AMMO3': '0.103', 'HITCOUNT': '0.360', 'ARMOR': '0.478', 'WEAPON3': '0.550', 'weapon2': '1.152', 'DAMAGECOUNT': '1.410', 'weapon3': '2.068', 'FRAGCOUNT': '6.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:53,728][63770] DAMAGECOUNT value on done: 14786.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:53,729][63770] Sum rewards: -2.592, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.903', 'AMMO5': '0.010', 'AMMO2': '0.025', 'WEAPON1': '0.040', 'ARMOR': '0.088', 'AMMO3': '0.096', 'AMMO4': '0.126', 'weapon5': '0.138', 'weapon4': '0.196', 'WEAPON5': '0.200', 'HITCOUNT': '0.250', 'WEAPON4': '0.350', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.885', 'FRAGCOUNT': '1.000', 'weapon2': '1.614', 'weapon3': '1.642'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:54,003][63769] DAMAGECOUNT value on done: 16519.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:54,004][63769] Sum rewards: -3.225, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.136', 'AMMO2': '0.007', 'AMMO5': '0.007', 'weapon5': '0.008', 'WEAPON1': '0.010', 'AMMO4': '0.035', 'WEAPON4': '0.050', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon4': '0.120', 'weapon7': '0.128', 'WEAPON5': '0.150', 'AMMO3': '0.173', 'HITCOUNT': '0.190', 'WEAPON7': '0.200', 'ARMOR': '0.448', 'DAMAGECOUNT': '0.741', 'weapon2': '0.762', 'WEAPON3': '1.000', 'FRAGCOUNT': '2.000', 'weapon3': '2.392'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:54,403][63769] DAMAGECOUNT value on done: 11749.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:54,404][63769] Sum rewards: -0.264, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.751', 'AMMO2': '0.003', 'AMMO4': '0.017', 'WEAPON1': '0.020', 'AMMO5': '0.022', 'ARMOR': '0.080', 'weapon5': '0.082', 'AMMO3': '0.159', 'HITCOUNT': '0.200', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.735', 'WEAPON3': '0.850', 'weapon2': '1.616', 'weapon3': '1.852', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:55,823][63767] DAMAGECOUNT value on done: 15853.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:55,823][63767] Sum rewards: -4.869, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.508', 'FRAGCOUNT': '-1.000', 'AMMO5': '0.014', 'AMMO2': '0.015', 'weapon4': '0.068', 'AMMO4': '0.073', 'ARMOR': '0.100', 'AMMO3': '0.117', 'weapon5': '0.156', 'WEAPON4': '0.200', 'HITCOUNT': '0.240', 'WEAPON5': '0.300', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.840', 'weapon2': '1.154', 'weapon3': '1.812'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:56,218][63767] DAMAGECOUNT value on done: 15825.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:56,219][63767] Sum rewards: -0.150, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.888', 'AMMO5': '0.009', 'AMMO2': '0.016', 'WEAPON1': '0.030', 'ARMOR': '0.036', 'weapon7': '0.050', 'AMMO4': '0.078', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.145', 'WEAPON5': '0.150', 'HITCOUNT': '0.190', 'WEAPON7': '0.200', 'weapon4': '0.200', 'weapon5': '0.244', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.636', 'WEAPON3': '0.650', 'weapon2': '0.684', 'weapon3': '1.830'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:56,245][63735] DAMAGECOUNT value on done: 14956.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:56,245][63735] Sum rewards: 0.186, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.373', 'AMMO2': '0.009', 'AMMO5': '0.010', 'weapon5': '0.018', 'WEAPON1': '0.020', 'AMMO4': '0.044', 'weapon7': '0.050', 'ARMOR': '0.080', 'AMMO3': '0.093', 'WEAPON4': '0.100', 'HITCOUNT': '0.130', 'WEAPON5': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'DAMAGECOUNT': '0.441', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.354', 'weapon3': '1.960'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:56,612][63735] DAMAGECOUNT value on done: 11517.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:56,613][63735] Sum rewards: -2.808, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.580', 'AMMO5': '0.007', 'AMMO2': '0.015', 'ARMOR': '0.016', 'WEAPON1': '0.030', 'weapon5': '0.076', 'AMMO4': '0.077', 'WEAPON5': '0.150', 'AMMO3': '0.157', 'HITCOUNT': '0.230', 'DAMAGECOUNT': '0.741', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.254', 'weapon3': '2.218'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:57,124][63732] Updated weights for policy 0, policy_version 2230 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:57,458][109198] Fps is (10 sec: 10649.6, 60 sec: 11127.5, 300 sec: 11205.2). Total num frames: 19075072. Throughput: 0: 1019.8, 1: 1746.7. Samples: 4765182. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:04:57,460][109198] Avg episode reward: [(0, '-1.622'), (1, '-1.607')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:57,465][63576] Saving new best policy, reward=-1.607!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:57,778][63769] DAMAGECOUNT value on done: 15001.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:57,778][63769] Sum rewards: 0.281, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.419', 'AMMO5': '0.003', 'AMMO2': '0.009', 'WEAPON1': '0.020', 'AMMO4': '0.045', 'WEAPON5': '0.050', 'weapon7': '0.052', 'weapon4': '0.056', 'AMMO3': '0.074', 'WEAPON4': '0.100', 'weapon5': '0.116', 'HITCOUNT': '0.140', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON7': '0.200', 'WEAPON3': '0.450', 'ARMOR': '0.529', 'DAMAGECOUNT': '0.540', 'FRAGCOUNT': '1.000', 'weapon3': '1.302', 'weapon2': '1.694'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:58,222][63769] DAMAGECOUNT value on done: 12883.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:58,223][63769] Sum rewards: -1.831, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.770', 'ARMOR': '0.008', 'AMMO2': '0.008', 'AMMO5': '0.010', 'WEAPON1': '0.030', 'AMMO4': '0.042', 'weapon7': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.061', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.104', 'weapon5': '0.150', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.350', 'FRAGCOUNT': '1.000', 'weapon3': '1.042', 'weapon2': '1.724'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:04:58,788][63733] Updated weights for policy 1, policy_version 2430 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:02,309][63806] DAMAGECOUNT value on done: 13289.0\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:02,458][109198] Fps is (10 sec: 10649.5, 60 sec: 11059.2, 300 sec: 11191.1). Total num frames: 19128320. Throughput: 0: 1022.6, 1: 1742.0. Samples: 4773400. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:02,460][109198] Avg episode reward: [(0, '-1.591'), (1, '-1.645')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:02,730][63806] DAMAGECOUNT value on done: 14442.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:02,730][63806] Sum rewards: 2.862, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.021', 'AMMO2': '0.017', 'AMMO5': '0.018', 'WEAPON4': '0.050', 'weapon7': '0.052', 'AMMO4': '0.083', 'AMMO3': '0.117', 'weapon5': '0.118', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon4': '0.198', 'WEAPON7': '0.200', 'HITCOUNT': '0.260', 'WEAPON5': '0.350', 'ARMOR': '0.412', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.215', 'weapon2': '1.528', 'weapon3': '1.676', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:04,078][63805] DAMAGECOUNT value on done: 15042.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:04,079][63805] Sum rewards: -4.498, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.314', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.030', 'ARMOR': '0.056', 'weapon5': '0.062', 'weapon4': '0.062', 'WEAPON5': '0.100', 'AMMO4': '0.151', 'AMMO3': '0.162', 'HITCOUNT': '0.180', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.630', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.416', 'weapon3': '2.104'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:04,557][63805] DAMAGECOUNT value on done: 13175.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:05,114][63733] Updated weights for policy 1, policy_version 2440 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:05,580][63735] DAMAGECOUNT value on done: 12377.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:05,951][63735] DAMAGECOUNT value on done: 17212.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:05,951][63735] Sum rewards: 0.741, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.940', 'AMMO4': '-0.027', 'AMMO2': '-0.005', 'AMMO5': '0.020', 'ARMOR': '0.032', 'WEAPON1': '0.040', 'AMMO3': '0.085', 'HITCOUNT': '0.220', 'WEAPON5': '0.300', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.960', 'weapon5': '1.030', 'weapon2': '1.214', 'weapon3': '1.362', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:06,331][63732] Updated weights for policy 0, policy_version 2240 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:07,045][63734] DAMAGECOUNT value on done: 14016.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:07,046][63734] Sum rewards: 2.346, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.129', 'AMMO5': '0.013', 'AMMO2': '0.027', 'ARMOR': '0.044', 'WEAPON4': '0.050', 'WEAPON1': '0.050', 'AMMO3': '0.092', 'weapon4': '0.108', 'AMMO4': '0.136', 'HITCOUNT': '0.250', 'WEAPON5': '0.250', 'weapon5': '0.334', 'WEAPON3': '0.500', 'DAMAGECOUNT': '1.221', 'weapon3': '1.552', 'weapon2': '1.598', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:07,410][63734] DAMAGECOUNT value on done: 13566.0\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:07,458][109198] Fps is (10 sec: 11059.2, 60 sec: 11059.2, 300 sec: 11205.0). Total num frames: 19185664. Throughput: 0: 1028.8, 1: 1731.0. Samples: 4789793. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:07,460][109198] Avg episode reward: [(0, '-1.605'), (1, '-1.512')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:07,469][63576] Saving new best policy, reward=-1.512!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:10,271][63771] DAMAGECOUNT value on done: 14835.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:10,272][63771] Sum rewards: -0.693, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.364', 'AMMO2': '0.016', 'AMMO5': '0.022', 'ARMOR': '0.028', 'WEAPON4': '0.050', 'WEAPON1': '0.060', 'weapon4': '0.074', 'AMMO4': '0.077', 'AMMO3': '0.141', 'weapon5': '0.182', 'HITCOUNT': '0.260', 'WEAPON5': '0.450', 'WEAPON3': '0.950', 'weapon2': '0.960', 'DAMAGECOUNT': '1.095', 'weapon3': '2.306', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:10,609][63771] DAMAGECOUNT value on done: 11650.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:10,609][63771] Sum rewards: -0.857, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.120', 'AMMO4': '-0.012', 'AMMO2': '-0.002', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'ARMOR': '0.052', 'AMMO3': '0.124', 'weapon5': '0.212', 'WEAPON5': '0.300', 'HITCOUNT': '0.310', 'WEAPON3': '0.750', 'weapon2': '1.068', 'DAMAGECOUNT': '1.128', 'FRAGCOUNT': '1.500', 'weapon3': '2.048'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:11,588][63733] Updated weights for policy 1, policy_version 2450 (0.0010)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:12,458][109198] Fps is (10 sec: 11059.3, 60 sec: 11059.2, 300 sec: 11177.2). Total num frames: 19238912. Throughput: 0: 1041.7, 1: 1702.6. Samples: 4806138. Policy #0 lag: (min: 0.0, avg: 0.2, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:12,460][109198] Avg episode reward: [(0, '-1.559'), (1, '-1.458')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:12,461][63576] Saving new best policy, reward=-1.458!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:14,736][63805] DAMAGECOUNT value on done: 15782.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:14,736][63805] Sum rewards: 0.978, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.168', 'AMMO2': '0.013', 'AMMO5': '0.025', 'WEAPON1': '0.040', 'weapon4': '0.056', 'AMMO4': '0.064', 'ARMOR': '0.071', 'AMMO3': '0.098', 'HITCOUNT': '0.150', 'WEAPON4': '0.200', 'WEAPON5': '0.400', 'weapon5': '0.646', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.825', 'weapon2': '0.922', 'weapon3': '1.736', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:15,080][63732] Updated weights for policy 0, policy_version 2250 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:15,113][63767] DAMAGECOUNT value on done: 16242.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:15,113][63767] Sum rewards: -2.239, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.781', 'AMMO5': '0.010', 'AMMO2': '0.014', 'AMMO4': '0.071', 'WEAPON4': '0.150', 'AMMO3': '0.160', 'weapon5': '0.184', 'WEAPON5': '0.200', 'weapon4': '0.218', 'HITCOUNT': '0.290', 'ARMOR': '0.432', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.984', 'weapon2': '1.150', 'weapon3': '1.828', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:15,142][63805] DAMAGECOUNT value on done: 16849.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:15,461][63767] DAMAGECOUNT value on done: 18623.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:15,462][63767] Sum rewards: 1.098, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-1.145', 'AMMO5': '0.009', 'AMMO2': '0.019', 'WEAPON1': '0.020', 'AMMO3': '0.054', 'AMMO4': '0.093', 'HITCOUNT': '0.130', 'weapon5': '0.188', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'WEAPON3': '0.350', 'weapon4': '0.454', 'DAMAGECOUNT': '0.513', 'ARMOR': '0.545', 'weapon3': '0.752', 'FRAGCOUNT': '1.000', 'weapon2': '2.166'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:15,823][63770] DAMAGECOUNT value on done: 16143.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:15,823][63770] Sum rewards: -2.672, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.661', 'AMMO2': '0.003', 'AMMO5': '0.015', 'AMMO4': '0.016', 'weapon4': '0.030', 'weapon5': '0.052', 'WEAPON1': '0.060', 'HITCOUNT': '0.060', 'ARMOR': '0.090', 'AMMO3': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.360', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.518', 'weapon2': '2.034'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:16,266][63770] DAMAGECOUNT value on done: 13288.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:16,267][63770] Sum rewards: -4.346, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.184', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'AMMO5': '0.015', 'WEAPON1': '0.030', 'weapon5': '0.062', 'ARMOR': '0.108', 'WEAPON5': '0.150', 'AMMO3': '0.164', 'HITCOUNT': '0.240', 'DAMAGECOUNT': '0.684', 'WEAPON3': '1.050', 'weapon2': '1.318', 'FRAGCOUNT': '2.000', 'weapon3': '2.280'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:16,295][63806] DAMAGECOUNT value on done: 14162.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:16,296][63806] Sum rewards: -1.969, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.072', 'AMMO2': '0.005', 'AMMO5': '0.025', 'AMMO4': '0.026', 'weapon5': '0.088', 'ARMOR': '0.092', 'WEAPON1': '0.120', 'AMMO3': '0.147', 'WEAPON4': '0.150', 'weapon4': '0.220', 'HITCOUNT': '0.470', 'WEAPON5': '0.500', 'WEAPON3': '0.900', 'weapon2': '1.312', 'DAMAGECOUNT': '1.581', 'weapon3': '1.966', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:16,616][63806] DAMAGECOUNT value on done: 14263.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:17,124][63734] DAMAGECOUNT value on done: 16670.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:17,125][63770] DAMAGECOUNT value on done: 13891.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:17,125][63770] Sum rewards: 2.951, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.435', 'ARMOR': '0.016', 'AMMO5': '0.030', 'AMMO2': '0.034', 'WEAPON1': '0.090', 'weapon4': '0.102', 'WEAPON4': '0.150', 'AMMO3': '0.170', 'AMMO4': '0.171', 'HITCOUNT': '0.370', 'weapon5': '0.432', 'WEAPON5': '0.500', 'WEAPON3': '0.800', 'weapon2': '1.412', 'DAMAGECOUNT': '1.545', 'weapon3': '1.564', 'FRAGCOUNT': '6.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:17,199][63771] DAMAGECOUNT value on done: 13020.0\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:17,458][109198] Fps is (10 sec: 10649.7, 60 sec: 10990.9, 300 sec: 11177.2). Total num frames: 19292160. Throughput: 0: 1053.5, 1: 1689.5. Samples: 4814410. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:17,459][109198] Avg episode reward: [(0, '-1.532'), (1, '-1.248')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:17,467][63576] Saving new best policy, reward=-1.248!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:17,498][63770] DAMAGECOUNT value on done: 15016.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:17,498][63770] Sum rewards: -4.159, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.260', 'AMMO2': '0.010', 'AMMO5': '0.023', 'AMMO4': '0.049', 'WEAPON4': '0.050', 'weapon4': '0.050', 'ARMOR': '0.068', 'WEAPON1': '0.070', 'AMMO3': '0.121', 'HITCOUNT': '0.210', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.690', 'WEAPON3': '0.800', 'weapon5': '0.838', 'FRAGCOUNT': '1.000', 'weapon2': '1.326', 'weapon3': '1.446'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:17,516][63734] DAMAGECOUNT value on done: 14585.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:17,516][63734] Sum rewards: -3.687, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.760', 'AMMO4': '-0.010', 'AMMO2': '-0.002', 'AMMO5': '0.025', 'WEAPON4': '0.100', 'WEAPON1': '0.100', 'weapon4': '0.100', 'HITCOUNT': '0.150', 'AMMO3': '0.178', 'weapon5': '0.204', 'DAMAGECOUNT': '0.495', 'WEAPON5': '0.500', 'WEAPON3': '0.650', 'weapon2': '1.510', 'weapon3': '1.822', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:17,621][63771] DAMAGECOUNT value on done: 16088.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:17,621][63771] Sum rewards: 0.364, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.920', 'AMMO4': '-0.027', 'AMMO2': '-0.005', 'AMMO5': '0.018', 'WEAPON1': '0.060', 'ARMOR': '0.080', 'AMMO3': '0.087', 'weapon5': '0.248', 'HITCOUNT': '0.250', 'WEAPON5': '0.400', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.849', 'weapon3': '1.522', 'FRAGCOUNT': '2.000', 'weapon2': '2.002'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:18,236][63733] Updated weights for policy 1, policy_version 2460 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:18,753][63767] DAMAGECOUNT value on done: 16662.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:18,754][63767] Sum rewards: 4.178, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.095', 'AMMO2': '0.007', 'AMMO5': '0.011', 'ARMOR': '0.020', 'WEAPON1': '0.020', 'AMMO4': '0.036', 'WEAPON4': '0.050', 'AMMO3': '0.104', 'weapon4': '0.132', 'WEAPON5': '0.250', 'weapon5': '0.282', 'WEAPON3': '0.650', 'HITCOUNT': '0.680', 'weapon2': '1.100', 'weapon3': '2.004', 'DAMAGECOUNT': '2.427', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:19,089][63767] DAMAGECOUNT value on done: 15900.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:19,090][63767] Sum rewards: -4.253, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.515', 'AMMO5': '0.005', 'AMMO2': '0.017', 'weapon5': '0.034', 'ARMOR': '0.040', 'HITCOUNT': '0.080', 'AMMO4': '0.085', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.127', 'DAMAGECOUNT': '0.225', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.230', 'weapon3': '2.268'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:19,351][63769] DAMAGECOUNT value on done: 17161.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:19,352][63769] Sum rewards: 3.234, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.388', 'AMMO2': '0.005', 'AMMO5': '0.018', 'AMMO4': '0.024', 'WEAPON1': '0.040', 'ARMOR': '0.040', 'weapon7': '0.082', 'WEAPON4': '0.100', 'AMMO3': '0.127', 'weapon4': '0.184', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.280', 'WEAPON5': '0.350', 'weapon5': '0.424', 'WEAPON3': '0.800', 'weapon2': '1.102', 'weapon3': '1.770', 'DAMAGECOUNT': '1.926', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:19,807][63769] DAMAGECOUNT value on done: 12084.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:19,807][63769] Sum rewards: 2.102, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.590', 'AMMO2': '0.005', 'AMMO4': '0.026', 'ARMOR': '0.028', 'AMMO5': '0.030', 'AMMO3': '0.082', 'WEAPON1': '0.090', 'WEAPON4': '0.100', 'weapon7': '0.118', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon4': '0.134', 'WEAPON7': '0.200', 'HITCOUNT': '0.270', 'WEAPON3': '0.550', 'weapon5': '0.576', 'WEAPON5': '0.600', 'DAMAGECOUNT': '1.005', 'weapon2': '1.094', 'weapon3': '1.544', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:21,135][63735] DAMAGECOUNT value on done: 15093.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:21,135][63735] Sum rewards: 0.853, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.648', 'AMMO2': '0.009', 'AMMO5': '0.015', 'ARMOR': '0.036', 'AMMO4': '0.046', 'WEAPON1': '0.050', 'weapon5': '0.078', 'AMMO3': '0.085', 'weapon4': '0.104', 'HITCOUNT': '0.140', 'WEAPON4': '0.150', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.411', 'WEAPON3': '0.600', 'weapon3': '1.502', 'weapon2': '1.974', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:21,541][63735] DAMAGECOUNT value on done: 11838.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:21,542][63735] Sum rewards: -4.243, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.232', 'AMMO2': '0.008', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'AMMO4': '0.039', 'ARMOR': '0.080', 'weapon5': '0.172', 'AMMO3': '0.197', 'WEAPON5': '0.200', 'HITCOUNT': '0.260', 'DAMAGECOUNT': '0.963', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.116', 'weapon3': '2.424'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:22,458][109198] Fps is (10 sec: 11059.1, 60 sec: 11059.2, 300 sec: 11177.2). Total num frames: 19349504. Throughput: 0: 1083.1, 1: 1646.7. Samples: 4830249. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:22,460][109198] Avg episode reward: [(0, '-1.513'), (1, '-1.104')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:22,462][63576] Saving new best policy, reward=-1.104!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:23,284][63769] DAMAGECOUNT value on done: 15181.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:23,284][63769] Sum rewards: -0.045, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.660', 'AMMO5': '0.003', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'AMMO4': '0.019', 'WEAPON5': '0.050', 'AMMO3': '0.077', 'weapon5': '0.130', 'HITCOUNT': '0.180', 'ARMOR': '0.521', 'DAMAGECOUNT': '0.540', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon2': '1.288', 'weapon3': '1.494'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:23,667][63769] DAMAGECOUNT value on done: 13018.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:23,868][63732] Updated weights for policy 0, policy_version 2260 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:25,123][63733] Updated weights for policy 1, policy_version 2470 (0.0017)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:27,078][63806] DAMAGECOUNT value on done: 13454.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:27,079][63806] Sum rewards: -1.193, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.708', 'AMMO5': '0.007', 'AMMO2': '0.011', 'WEAPON1': '0.030', 'AMMO4': '0.055', 'AMMO3': '0.100', 'WEAPON4': '0.100', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'weapon4': '0.168', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.550', 'weapon5': '0.934', 'FRAGCOUNT': '1.000', 'weapon2': '1.218', 'weapon3': '1.306'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:27,458][109198] Fps is (10 sec: 11059.2, 60 sec: 10922.7, 300 sec: 11163.3). Total num frames: 19402752. Throughput: 0: 1116.5, 1: 1608.3. Samples: 4846677. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:27,460][109198] Avg episode reward: [(0, '-1.498'), (1, '-1.114')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:27,473][63806] DAMAGECOUNT value on done: 14891.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:27,473][63806] Sum rewards: 2.912, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.214', 'AMMO5': '0.010', 'AMMO2': '0.019', 'weapon5': '0.028', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'AMMO4': '0.092', 'AMMO3': '0.184', 'WEAPON5': '0.200', 'HITCOUNT': '0.360', 'ARMOR': '0.400', 'WEAPON3': '0.800', 'weapon2': '1.294', 'DAMAGECOUNT': '1.347', 'weapon3': '2.312', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:29,378][63805] DAMAGECOUNT value on done: 15336.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:29,378][63805] Sum rewards: -0.173, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO2': '0.005', 'AMMO5': '0.015', 'AMMO4': '0.025', 'HEALTH': '0.027', 'ARMOR': '0.042', 'AMMO3': '0.094', 'weapon5': '0.244', 'WEAPON5': '0.250', 'HITCOUNT': '0.250', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.882', 'FRAGCOUNT': '1.000', 'weapon2': '1.476', 'weapon3': '1.716'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:29,782][63805] DAMAGECOUNT value on done: 13550.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:29,783][63805] Sum rewards: -0.240, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.784', 'ARMOR': '0.004', 'AMMO2': '0.018', 'AMMO5': '0.025', 'AMMO3': '0.076', 'weapon4': '0.086', 'AMMO4': '0.090', 'WEAPON1': '0.120', 'WEAPON4': '0.150', 'HITCOUNT': '0.290', 'weapon5': '0.368', 'WEAPON3': '0.500', 'WEAPON5': '0.500', 'DAMAGECOUNT': '1.125', 'weapon2': '1.294', 'weapon3': '1.398', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:30,495][63735] DAMAGECOUNT value on done: 12820.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:30,496][63735] Sum rewards: -4.927, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.572', 'AMMO4': '-0.054', 'AMMO2': '-0.011', 'AMMO5': '0.024', 'ARMOR': '0.052', 'AMMO3': '0.172', 'HITCOUNT': '0.230', 'weapon5': '0.256', 'WEAPON5': '0.400', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.329', 'weapon2': '1.348', 'weapon3': '1.998', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:30,886][63735] DAMAGECOUNT value on done: 17583.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:30,886][63735] Sum rewards: 2.792, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.620', 'AMMO2': '0.000', 'AMMO4': '0.002', 'weapon4': '0.008', 'AMMO5': '0.017', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'WEAPON1': '0.090', 'AMMO3': '0.111', 'weapon5': '0.218', 'WEAPON5': '0.350', 'HITCOUNT': '0.370', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.113', 'weapon2': '1.328', 'weapon3': '2.064', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:31,776][63732] Updated weights for policy 0, policy_version 2270 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:32,060][63733] Updated weights for policy 1, policy_version 2480 (0.0012)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:32,458][109198] Fps is (10 sec: 10649.7, 60 sec: 10922.7, 300 sec: 11177.2). Total num frames: 19456000. Throughput: 0: 1132.8, 1: 1589.1. Samples: 4854878. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:32,459][109198] Avg episode reward: [(0, '-1.406'), (1, '-1.086')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:32,461][63576] Saving new best policy, reward=-1.086!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:32,901][63734] DAMAGECOUNT value on done: 14320.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:32,901][63734] Sum rewards: -3.521, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.740', 'AMMO5': '0.012', 'AMMO2': '0.016', 'WEAPON1': '0.050', 'AMMO4': '0.078', 'AMMO3': '0.157', 'weapon5': '0.188', 'HITCOUNT': '0.250', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.912', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.308', 'weapon3': '1.998'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:33,244][63734] DAMAGECOUNT value on done: 14002.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:33,244][63734] Sum rewards: -0.327, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.732', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO2': '0.013', 'ARMOR': '0.040', 'AMMO4': '0.065', 'AMMO3': '0.117', 'weapon5': '0.184', 'WEAPON5': '0.200', 'HITCOUNT': '0.450', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.308', 'weapon2': '1.692', 'weapon3': '1.814', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:35,837][63771] DAMAGECOUNT value on done: 15083.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:35,837][63771] Sum rewards: -2.859, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.052', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.016', 'AMMO5': '0.018', 'WEAPON1': '0.060', 'AMMO4': '0.080', 'AMMO3': '0.093', 'WEAPON4': '0.100', 'weapon4': '0.190', 'HITCOUNT': '0.280', 'WEAPON5': '0.350', 'WEAPON3': '0.450', 'weapon5': '0.480', 'DAMAGECOUNT': '0.744', 'weapon3': '1.150', 'weapon2': '1.432'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:36,193][63771] DAMAGECOUNT value on done: 11800.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:36,194][63771] Sum rewards: -5.705, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.946', 'AMMO5': '0.015', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'AMMO4': '0.088', 'HITCOUNT': '0.090', 'AMMO3': '0.142', 'WEAPON4': '0.150', 'weapon4': '0.174', 'WEAPON5': '0.250', 'weapon5': '0.262', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.238', 'weapon3': '1.758'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:37,458][109198] Fps is (10 sec: 11059.2, 60 sec: 10922.7, 300 sec: 11177.2). Total num frames: 19513344. Throughput: 0: 1170.1, 1: 1557.1. Samples: 4871358. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:37,460][109198] Avg episode reward: [(0, '-1.389'), (1, '-1.065')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:37,466][63576] Saving new best policy, reward=-1.065!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:38,277][63805] DAMAGECOUNT value on done: 15892.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:38,678][63805] DAMAGECOUNT value on done: 17085.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:38,679][63805] Sum rewards: -1.442, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.775', 'AMMO5': '0.010', 'AMMO2': '0.018', 'WEAPON1': '0.060', 'AMMO4': '0.091', 'AMMO3': '0.107', 'WEAPON4': '0.150', 'HITCOUNT': '0.170', 'WEAPON5': '0.200', 'weapon5': '0.224', 'weapon4': '0.248', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.708', 'weapon3': '1.522', 'weapon2': '1.524', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:39,083][63733] Updated weights for policy 1, policy_version 2490 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:39,251][63806] DAMAGECOUNT value on done: 14512.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:39,252][63806] Sum rewards: 1.440, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.053', 'AMMO2': '0.011', 'AMMO5': '0.028', 'weapon4': '0.038', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'AMMO4': '0.056', 'WEAPON1': '0.080', 'AMMO3': '0.140', 'weapon5': '0.204', 'HITCOUNT': '0.250', 'WEAPON5': '0.350', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.050', 'weapon2': '1.470', 'weapon3': '1.826', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:39,593][63806] DAMAGECOUNT value on done: 14503.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:39,594][63806] Sum rewards: -5.050, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.866', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'AMMO2': '0.030', 'weapon5': '0.052', 'ARMOR': '0.068', 'weapon4': '0.086', 'WEAPON5': '0.150', 'AMMO4': '0.151', 'AMMO3': '0.157', 'HITCOUNT': '0.210', 'WEAPON4': '0.400', 'DAMAGECOUNT': '0.720', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.660', 'weapon2': '1.802'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:39,818][63732] Updated weights for policy 0, policy_version 2280 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:40,166][63767] DAMAGECOUNT value on done: 16749.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:40,166][63767] Sum rewards: -1.222, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.328', 'AMMO2': '0.010', 'AMMO5': '0.020', 'ARMOR': '0.032', 'AMMO4': '0.047', 'WEAPON4': '0.050', 'weapon4': '0.112', 'weapon5': '0.156', 'AMMO3': '0.212', 'HITCOUNT': '0.310', 'WEAPON5': '0.400', 'weapon2': '1.130', 'WEAPON3': '1.300', 'DAMAGECOUNT': '1.521', 'weapon3': '2.306', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:40,601][63767] DAMAGECOUNT value on done: 18798.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:40,602][63767] Sum rewards: -5.913, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.724', 'AMMO2': '0.006', 'ARMOR': '0.016', 'AMMO5': '0.020', 'AMMO4': '0.028', 'WEAPON4': '0.050', 'weapon4': '0.076', 'WEAPON1': '0.090', 'AMMO3': '0.104', 'weapon5': '0.160', 'HITCOUNT': '0.180', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.525', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.362', 'weapon2': '1.794'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:40,746][63770] DAMAGECOUNT value on done: 13941.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:40,746][63770] Sum rewards: -1.047, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.707', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.015', 'weapon5': '0.034', 'WEAPON5': '0.050', 'ARMOR': '0.060', 'HITCOUNT': '0.060', 'AMMO4': '0.074', 'AMMO3': '0.100', 'DAMAGECOUNT': '0.150', 'WEAPON4': '0.250', 'weapon4': '0.270', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon2': '1.416', 'weapon3': '1.668'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:41,120][63770] DAMAGECOUNT value on done: 15230.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:41,121][63770] Sum rewards: -6.784, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.162', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.018', 'AMMO2': '0.024', 'ARMOR': '0.044', 'WEAPON4': '0.050', 'WEAPON1': '0.070', 'AMMO4': '0.118', 'HITCOUNT': '0.160', 'weapon4': '0.162', 'AMMO3': '0.164', 'weapon5': '0.174', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.642', 'WEAPON3': '1.000', 'weapon2': '1.050', 'weapon3': '2.102'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:41,227][63770] DAMAGECOUNT value on done: 16233.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:41,228][63770] Sum rewards: -1.450, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.424', 'AMMO2': '0.000', 'AMMO4': '0.001', 'AMMO5': '0.010', 'AMMO3': '0.063', 'WEAPON1': '0.070', 'HITCOUNT': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.256', 'DAMAGECOUNT': '0.270', 'ARMOR': '0.400', 'WEAPON3': '0.450', 'FRAGCOUNT': '1.000', 'weapon3': '1.404', 'weapon2': '1.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:41,530][63767] DAMAGECOUNT value on done: 16962.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:41,530][63767] Sum rewards: -1.327, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.492', 'AMMO5': '0.010', 'ARMOR': '0.012', 'AMMO2': '0.022', 'weapon4': '0.090', 'WEAPON4': '0.100', 'AMMO4': '0.111', 'AMMO3': '0.146', 'WEAPON5': '0.150', 'weapon5': '0.198', 'HITCOUNT': '0.220', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.900', 'weapon2': '1.668', 'weapon3': '1.788', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:41,627][63770] DAMAGECOUNT value on done: 13869.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:41,628][63770] Sum rewards: 0.980, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.840', 'AMMO4': '-0.044', 'AMMO2': '-0.009', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'weapon4': '0.060', 'AMMO3': '0.122', 'weapon5': '0.220', 'WEAPON5': '0.300', 'HITCOUNT': '0.400', 'WEAPON3': '0.800', 'weapon2': '1.474', 'weapon3': '1.666', 'DAMAGECOUNT': '1.743', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:41,877][63767] DAMAGECOUNT value on done: 16232.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:41,878][63767] Sum rewards: -4.634, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.188', 'AMMO5': '0.010', 'AMMO2': '0.014', 'weapon4': '0.048', 'AMMO4': '0.068', 'ARMOR': '0.086', 'WEAPON4': '0.150', 'AMMO3': '0.162', 'weapon5': '0.166', 'WEAPON5': '0.200', 'HITCOUNT': '0.250', 'WEAPON3': '0.950', 'DAMAGECOUNT': '0.996', 'FRAGCOUNT': '1.000', 'weapon2': '1.426', 'weapon3': '2.028'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:42,458][109198] Fps is (10 sec: 11059.2, 60 sec: 10922.7, 300 sec: 11163.3). Total num frames: 19566592. Throughput: 0: 1205.2, 1: 1519.2. Samples: 4887777. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:42,460][109198] Avg episode reward: [(0, '-1.418'), (1, '-1.225')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:42,776][63771] DAMAGECOUNT value on done: 13189.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:42,776][63771] Sum rewards: -0.064, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.564', 'AMMO5': '0.007', 'AMMO2': '0.013', 'weapon4': '0.020', 'WEAPON4': '0.050', 'AMMO4': '0.067', 'ARMOR': '0.076', 'AMMO3': '0.135', 'weapon5': '0.138', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.507', 'WEAPON3': '0.800', 'weapon2': '1.162', 'weapon3': '1.734', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:42,930][63734] DAMAGECOUNT value on done: 16886.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:42,930][63734] Sum rewards: -3.994, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.110', 'AMMO2': '0.002', 'AMMO4': '0.010', 'AMMO5': '0.010', 'ARMOR': '0.024', 'weapon5': '0.074', 'AMMO3': '0.142', 'WEAPON5': '0.200', 'HITCOUNT': '0.250', 'DAMAGECOUNT': '0.648', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.470', 'weapon3': '2.186'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:43,177][63771] DAMAGECOUNT value on done: 16286.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:43,288][63734] DAMAGECOUNT value on done: 15139.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:43,288][63734] Sum rewards: 5.811, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.520', 'AMMO4': '-0.068', 'AMMO2': '-0.013', 'AMMO5': '0.010', 'weapon5': '0.032', 'ARMOR': '0.050', 'weapon4': '0.064', 'AMMO3': '0.080', 'WEAPON1': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'HITCOUNT': '0.430', 'WEAPON3': '0.550', 'weapon3': '1.478', 'DAMAGECOUNT': '1.662', 'weapon2': '1.906', 'FRAGCOUNT': '6.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:44,646][63769] DAMAGECOUNT value on done: 17760.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:44,646][63769] Sum rewards: 5.394, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.267', 'AMMO2': '0.009', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'weapon5': '0.030', 'AMMO4': '0.043', 'AMMO3': '0.092', 'weapon4': '0.168', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'HITCOUNT': '0.420', 'ARMOR': '0.452', 'WEAPON3': '0.700', 'weapon2': '1.552', 'weapon3': '1.710', 'DAMAGECOUNT': '1.797', 'FRAGCOUNT': '6.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:45,053][63769] DAMAGECOUNT value on done: 12175.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:45,053][63769] Sum rewards: 0.520, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.583', 'AMMO2': '0.005', 'AMMO5': '0.007', 'AMMO4': '0.023', 'ARMOR': '0.024', 'WEAPON1': '0.050', 'AMMO3': '0.079', 'HITCOUNT': '0.110', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.273', 'WEAPON3': '0.450', 'weapon5': '0.694', 'FRAGCOUNT': '1.000', 'weapon3': '1.320', 'weapon2': '1.418'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:46,140][63735] DAMAGECOUNT value on done: 15303.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:46,371][63769] DAMAGECOUNT value on done: 15385.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:46,372][63769] Sum rewards: -0.503, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.010', 'AMMO4': '-0.039', 'AMMO2': '-0.008', 'AMMO5': '0.017', 'WEAPON1': '0.040', 'ARMOR': '0.054', 'WEAPON4': '0.100', 'AMMO3': '0.127', 'weapon4': '0.208', 'HITCOUNT': '0.210', 'WEAPON5': '0.400', 'weapon5': '0.492', 'DAMAGECOUNT': '0.612', 'WEAPON3': '0.900', 'weapon2': '1.104', 'weapon3': '1.790', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:46,459][63733] Updated weights for policy 1, policy_version 2500 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:46,515][63735] DAMAGECOUNT value on done: 12438.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:46,516][63735] Sum rewards: 1.430, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.242', 'AMMO5': '0.007', 'AMMO2': '0.012', 'WEAPON1': '0.020', 'ARMOR': '0.028', 'AMMO4': '0.061', 'weapon5': '0.080', 'WEAPON5': '0.100', 'AMMO3': '0.183', 'HITCOUNT': '0.380', 'WEAPON3': '0.950', 'weapon2': '1.236', 'DAMAGECOUNT': '1.800', 'weapon3': '2.314', 'FRAGCOUNT': '6.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:46,763][63769] DAMAGECOUNT value on done: 13234.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:46,763][63769] Sum rewards: -4.530, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.705', 'AMMO2': '0.002', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO4': '0.010', 'weapon5': '0.020', 'ARMOR': '0.056', 'weapon7': '0.080', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.130', 'HITCOUNT': '0.180', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.648', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.620', 'weapon3': '1.668'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:47,410][63732] Updated weights for policy 0, policy_version 2290 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:47,458][109198] Fps is (10 sec: 11059.2, 60 sec: 10922.7, 300 sec: 11163.3). Total num frames: 19623936. Throughput: 0: 1221.0, 1: 1498.0. Samples: 4895754. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:47,459][109198] Avg episode reward: [(0, '-1.281'), (1, '-1.153')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:51,910][63806] DAMAGECOUNT value on done: 13577.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:51,911][63806] Sum rewards: -1.066, reward structure: {'DEATHCOUNT': '-3.750', 'HEALTH': '-1.125', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.008', 'AMMO5': '0.009', 'weapon5': '0.032', 'AMMO4': '0.040', 'weapon4': '0.044', 'AMMO3': '0.060', 'WEAPON1': '0.060', 'WEAPON4': '0.100', 'HITCOUNT': '0.130', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.369', 'WEAPON3': '0.450', 'weapon3': '1.346', 'weapon2': '1.460'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:52,285][63806] DAMAGECOUNT value on done: 15133.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:52,286][63806] Sum rewards: -2.278, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.524', 'AMMO4': '-0.055', 'AMMO2': '-0.011', 'weapon5': '0.014', 'AMMO5': '0.015', 'WEAPON1': '0.080', 'AMMO3': '0.143', 'HITCOUNT': '0.190', 'WEAPON5': '0.300', 'ARMOR': '0.508', 'DAMAGECOUNT': '0.726', 'WEAPON3': '0.800', 'weapon2': '1.092', 'weapon3': '1.944', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:52,458][109198] Fps is (10 sec: 10649.5, 60 sec: 10854.4, 300 sec: 11149.5). Total num frames: 19673088. Throughput: 0: 1254.5, 1: 1461.7. Samples: 4912019. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:52,460][109198] Avg episode reward: [(0, '-1.282'), (1, '-1.150')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:54,027][63733] Updated weights for policy 1, policy_version 2510 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:54,507][63805] DAMAGECOUNT value on done: 15671.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:54,508][63805] Sum rewards: 2.929, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.086', 'AMMO5': '0.010', 'AMMO2': '0.020', 'WEAPON1': '0.030', 'AMMO4': '0.101', 'AMMO3': '0.110', 'HITCOUNT': '0.130', 'weapon5': '0.136', 'WEAPON5': '0.200', 'ARMOR': '0.416', 'WEAPON3': '0.550', 'DAMAGECOUNT': '1.005', 'weapon2': '1.220', 'weapon3': '2.086', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:54,903][63805] DAMAGECOUNT value on done: 14057.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:54,904][63805] Sum rewards: 0.108, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.783', 'AMMO2': '0.010', 'AMMO5': '0.017', 'ARMOR': '0.040', 'weapon4': '0.040', 'weapon7': '0.046', 'WEAPON4': '0.050', 'AMMO4': '0.052', 'WEAPON1': '0.070', 'weapon5': '0.100', 'AMMO3': '0.128', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.330', 'WEAPON5': '0.350', 'WEAPON3': '0.900', 'weapon2': '1.252', 'DAMAGECOUNT': '1.521', 'weapon3': '2.134', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:54,984][63732] Updated weights for policy 0, policy_version 2300 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:55,640][63735] DAMAGECOUNT value on done: 13255.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:55,640][63735] Sum rewards: 2.317, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.463', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'ARMOR': '0.032', 'AMMO3': '0.101', 'WEAPON5': '0.150', 'HITCOUNT': '0.240', 'weapon5': '0.348', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.305', 'weapon2': '1.462', 'weapon3': '1.780', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:56,046][63735] DAMAGECOUNT value on done: 17804.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:56,046][63735] Sum rewards: -1.224, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO5': '0.007', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'ARMOR': '0.050', 'AMMO4': '0.092', 'WEAPON4': '0.100', 'weapon4': '0.102', 'AMMO3': '0.103', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'weapon5': '0.184', 'WEAPON3': '0.550', 'HEALTH': '0.592', 'DAMAGECOUNT': '0.663', 'FRAGCOUNT': '1.000', 'weapon2': '1.446', 'weapon3': '1.808'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:57,458][109198] Fps is (10 sec: 10649.5, 60 sec: 10922.7, 300 sec: 11149.4). Total num frames: 19730432. Throughput: 0: 1280.8, 1: 1439.0. Samples: 4928526. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:05:57,460][109198] Avg episode reward: [(0, '-1.208'), (1, '-1.124')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:58,530][63734] DAMAGECOUNT value on done: 14430.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:58,531][63734] Sum rewards: -3.992, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.152', 'AMMO2': '0.011', 'AMMO5': '0.025', 'weapon4': '0.030', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'WEAPON1': '0.050', 'AMMO4': '0.055', 'AMMO3': '0.075', 'HITCOUNT': '0.100', 'weapon5': '0.224', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.400', 'WEAPON5': '0.450', 'weapon3': '1.510', 'weapon2': '1.818'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:58,911][63734] DAMAGECOUNT value on done: 14343.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:05:58,911][63734] Sum rewards: -0.699, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.102', 'AMMO2': '0.005', 'AMMO5': '0.005', 'AMMO4': '0.022', 'ARMOR': '0.036', 'WEAPON1': '0.040', 'AMMO3': '0.152', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'weapon5': '0.272', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.023', 'weapon2': '1.046', 'weapon3': '2.092', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:01,102][63805] DAMAGECOUNT value on done: 15962.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:01,255][63771] DAMAGECOUNT value on done: 15308.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:01,256][63771] Sum rewards: -1.546, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.490', 'AMMO2': '0.004', 'weapon7': '0.016', 'AMMO5': '0.020', 'AMMO4': '0.021', 'weapon5': '0.068', 'ARMOR': '0.070', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON1': '0.100', 'AMMO3': '0.112', 'weapon4': '0.114', 'WEAPON4': '0.150', 'HITCOUNT': '0.210', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.700', 'weapon2': '1.132', 'FRAGCOUNT': '2.000', 'weapon3': '2.102'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:01,477][63805] DAMAGECOUNT value on done: 17405.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:01,478][63805] Sum rewards: 1.900, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.032', 'ARMOR': '0.048', 'WEAPON5': '0.050', 'AMMO3': '0.116', 'AMMO4': '0.161', 'weapon4': '0.218', 'HITCOUNT': '0.250', 'WEAPON4': '0.300', 'HEALTH': '0.470', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.960', 'weapon3': '1.480', 'weapon2': '1.802', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:01,493][63733] Updated weights for policy 1, policy_version 2520 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:01,715][63771] DAMAGECOUNT value on done: 12075.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:01,715][63771] Sum rewards: -5.203, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.074', 'AMMO4': '-0.024', 'AMMO2': '-0.005', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'weapon5': '0.014', 'ARMOR': '0.060', 'AMMO3': '0.195', 'WEAPON5': '0.200', 'HITCOUNT': '0.290', 'DAMAGECOUNT': '0.825', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.100', 'weapon2': '1.342', 'weapon3': '2.354'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:01,772][63806] DAMAGECOUNT value on done: 14558.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:01,772][63806] Sum rewards: -5.624, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.394', 'AMMO5': '0.007', 'AMMO2': '0.009', 'WEAPON1': '0.020', 'ARMOR': '0.028', 'AMMO4': '0.043', 'HITCOUNT': '0.080', 'AMMO3': '0.129', 'DAMAGECOUNT': '0.138', 'WEAPON5': '0.150', 'weapon5': '0.322', 'WEAPON3': '0.550', 'weapon3': '1.258', 'weapon2': '1.786'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:02,095][63806] DAMAGECOUNT value on done: 14863.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:02,096][63806] Sum rewards: -2.390, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.900', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'AMMO5': '0.020', 'WEAPON1': '0.100', 'AMMO3': '0.150', 'weapon5': '0.258', 'HITCOUNT': '0.320', 'WEAPON5': '0.400', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.080', 'weapon2': '1.254', 'FRAGCOUNT': '2.000', 'weapon3': '2.086'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:02,458][109198] Fps is (10 sec: 11059.3, 60 sec: 10922.7, 300 sec: 11149.5). Total num frames: 19783680. Throughput: 0: 1291.5, 1: 1426.5. Samples: 4936721. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:02,460][109198] Avg episode reward: [(0, '-1.313'), (1, '-1.165')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:02,470][63732] Updated weights for policy 0, policy_version 2310 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:04,319][63767] DAMAGECOUNT value on done: 17262.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:04,320][63767] Sum rewards: -2.326, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.060', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.019', 'WEAPON1': '0.030', 'weapon5': '0.052', 'WEAPON4': '0.100', 'AMMO3': '0.135', 'weapon7': '0.154', 'weapon4': '0.174', 'HITCOUNT': '0.250', 'AMMO6': '0.300', 'WEAPON7': '0.300', 'AMMO7': '0.300', 'WEAPON5': '0.400', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.026', 'weapon3': '1.940'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:04,685][63767] DAMAGECOUNT value on done: 16562.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:04,685][63767] Sum rewards: -2.429, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.380', 'AMMO4': '-0.029', 'AMMO2': '-0.006', 'AMMO5': '0.003', 'WEAPON1': '0.030', 'weapon5': '0.056', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.167', 'weapon4': '0.198', 'HITCOUNT': '0.280', 'ARMOR': '0.516', 'WEAPON3': '0.950', 'DAMAGECOUNT': '0.990', 'weapon2': '1.254', 'weapon3': '2.092', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:05,265][63767] DAMAGECOUNT value on done: 17262.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:05,265][63767] Sum rewards: -0.736, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.030', 'AMMO2': '0.005', 'AMMO5': '0.014', 'AMMO4': '0.023', 'weapon5': '0.090', 'WEAPON4': '0.100', 'weapon4': '0.102', 'AMMO3': '0.155', 'WEAPON5': '0.300', 'HITCOUNT': '0.390', 'ARMOR': '0.488', 'WEAPON3': '0.950', 'weapon2': '0.956', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.539', 'weapon3': '2.432'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:05,663][63767] DAMAGECOUNT value on done: 18861.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:06,359][63770] DAMAGECOUNT value on done: 14100.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:06,359][63770] Sum rewards: -1.328, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.332', 'AMMO2': '0.008', 'AMMO5': '0.013', 'AMMO4': '0.041', 'ARMOR': '0.112', 'AMMO3': '0.122', 'HITCOUNT': '0.130', 'WEAPON4': '0.150', 'WEAPON5': '0.250', 'weapon5': '0.368', 'weapon4': '0.390', 'DAMAGECOUNT': '0.477', 'WEAPON3': '0.650', 'weapon2': '0.900', 'FRAGCOUNT': '1.000', 'weapon3': '1.392'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:06,743][63770] DAMAGECOUNT value on done: 15344.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:06,743][63770] Sum rewards: -3.997, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.086', 'AMMO5': '0.020', 'weapon4': '0.028', 'AMMO2': '0.033', 'WEAPON1': '0.070', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.155', 'AMMO4': '0.166', 'weapon5': '0.260', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.342', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.154', 'weapon3': '2.100'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:06,823][63770] DAMAGECOUNT value on done: 16404.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:06,823][63770] Sum rewards: -0.230, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.293', 'AMMO2': '0.011', 'AMMO5': '0.013', 'ARMOR': '0.024', 'WEAPON1': '0.050', 'AMMO4': '0.055', 'AMMO3': '0.101', 'HITCOUNT': '0.150', 'weapon5': '0.190', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.513', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.464', 'weapon3': '1.792'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:07,223][63770] DAMAGECOUNT value on done: 14687.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:07,223][63770] Sum rewards: 2.531, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.662', 'AMMO2': '0.014', 'AMMO5': '0.020', 'WEAPON4': '0.050', 'AMMO4': '0.071', 'weapon7': '0.084', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.115', 'weapon4': '0.210', 'WEAPON5': '0.300', 'weapon5': '0.378', 'ARMOR': '0.440', 'WEAPON3': '0.500', 'HITCOUNT': '0.590', 'weapon2': '1.054', 'weapon3': '1.612', 'DAMAGECOUNT': '2.454', 'FRAGCOUNT': '2.500'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:07,458][109198] Fps is (10 sec: 11059.3, 60 sec: 10922.7, 300 sec: 11149.5). Total num frames: 19841024. Throughput: 0: 1320.8, 1: 1412.5. Samples: 4953245. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:07,460][109198] Avg episode reward: [(0, '-1.282'), (1, '-1.210')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:08,195][63771] DAMAGECOUNT value on done: 13356.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:08,482][63734] DAMAGECOUNT value on done: 17171.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:08,483][63734] Sum rewards: 1.297, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.156', 'AMMO5': '0.005', 'AMMO2': '0.008', 'weapon5': '0.034', 'WEAPON1': '0.040', 'AMMO4': '0.042', 'WEAPON5': '0.100', 'AMMO3': '0.105', 'HITCOUNT': '0.140', 'ARMOR': '0.502', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.855', 'weapon2': '1.062', 'weapon3': '1.910', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:08,596][63771] DAMAGECOUNT value on done: 16716.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:08,596][63771] Sum rewards: 0.161, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.538', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'ARMOR': '0.024', 'AMMO5': '0.025', 'WEAPON1': '0.070', 'AMMO3': '0.084', 'weapon5': '0.244', 'HITCOUNT': '0.380', 'WEAPON5': '0.500', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.290', 'weapon2': '1.394', 'weapon3': '1.896'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:08,874][63734] DAMAGECOUNT value on done: 15343.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:08,874][63734] Sum rewards: 0.625, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.786', 'AMMO2': '0.011', 'AMMO5': '0.023', 'ARMOR': '0.028', 'weapon5': '0.038', 'AMMO4': '0.057', 'weapon7': '0.068', 'WEAPON1': '0.070', 'WEAPON4': '0.100', 'AMMO3': '0.104', 'weapon4': '0.112', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.170', 'WEAPON7': '0.200', 'WEAPON5': '0.350', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.612', 'FRAGCOUNT': '1.000', 'weapon3': '1.374', 'weapon2': '1.554'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:08,890][63733] Updated weights for policy 1, policy_version 2530 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:09,603][63769] DAMAGECOUNT value on done: 15612.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:09,603][63769] Sum rewards: -0.819, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.850', 'weapon4': '0.004', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'AMMO5': '0.018', 'AMMO4': '0.084', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON4': '0.100', 'weapon7': '0.106', 'HITCOUNT': '0.120', 'AMMO3': '0.125', 'weapon5': '0.256', 'WEAPON5': '0.350', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.681', 'weapon3': '1.436', 'FRAGCOUNT': '1.500', 'weapon2': '1.824'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:09,968][63732] Updated weights for policy 0, policy_version 2320 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:09,968][63769] DAMAGECOUNT value on done: 13699.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:09,969][63769] Sum rewards: -0.606, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.230', 'AMMO2': '0.007', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'ARMOR': '0.021', 'AMMO4': '0.033', 'AMMO3': '0.181', 'weapon5': '0.208', 'WEAPON5': '0.300', 'HITCOUNT': '0.330', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.395', 'weapon2': '1.456', 'weapon3': '1.918', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:10,090][63769] DAMAGECOUNT value on done: 18244.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:10,091][63769] Sum rewards: 0.117, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.214', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'AMMO5': '0.003', 'WEAPON1': '0.020', 'weapon5': '0.028', 'ARMOR': '0.043', 'WEAPON5': '0.050', 'AMMO3': '0.084', 'WEAPON4': '0.100', 'weapon4': '0.104', 'HITCOUNT': '0.370', 'WEAPON3': '0.650', 'weapon2': '1.258', 'DAMAGECOUNT': '1.452', 'weapon3': '1.930', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:10,482][63769] DAMAGECOUNT value on done: 12320.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:10,482][63769] Sum rewards: -1.110, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.780', 'AMMO5': '0.007', 'AMMO2': '0.034', 'weapon4': '0.042', 'ARMOR': '0.068', 'WEAPON1': '0.070', 'HITCOUNT': '0.120', 'AMMO3': '0.131', 'weapon5': '0.164', 'AMMO4': '0.170', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.246', 'weapon3': '1.832'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:11,246][63735] DAMAGECOUNT value on done: 15353.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:11,620][63735] DAMAGECOUNT value on done: 12883.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:11,621][63735] Sum rewards: -2.409, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.442', 'AMMO2': '0.012', 'AMMO5': '0.015', 'weapon7': '0.022', 'AMMO4': '0.057', 'ARMOR': '0.068', 'weapon5': '0.082', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.120', 'HITCOUNT': '0.180', 'WEAPON4': '0.200', 'weapon4': '0.218', 'WEAPON5': '0.300', 'WEAPON3': '0.750', 'weapon2': '1.236', 'DAMAGECOUNT': '1.335', 'weapon3': '1.888', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:12,459][109198] Fps is (10 sec: 11058.8, 60 sec: 10922.6, 300 sec: 11149.4). Total num frames: 19894272. Throughput: 0: 1337.3, 1: 1397.5. Samples: 4969744. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:12,461][109198] Avg episode reward: [(0, '-1.285'), (1, '-1.240')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:16,287][63733] Updated weights for policy 1, policy_version 2540 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:16,371][63806] DAMAGECOUNT value on done: 14012.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:16,371][63806] Sum rewards: 0.063, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.308', 'weapon4': '0.002', 'AMMO2': '0.009', 'AMMO5': '0.018', 'ARMOR': '0.024', 'AMMO4': '0.043', 'WEAPON4': '0.050', 'WEAPON1': '0.070', 'AMMO3': '0.095', 'weapon5': '0.240', 'WEAPON5': '0.250', 'HITCOUNT': '0.350', 'WEAPON3': '0.500', 'weapon3': '1.236', 'DAMAGECOUNT': '1.305', 'weapon2': '1.680', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:16,739][63806] DAMAGECOUNT value on done: 15275.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:16,739][63806] Sum rewards: 2.346, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-0.487', 'AMMO5': '0.005', 'AMMO2': '0.005', 'weapon4': '0.010', 'AMMO4': '0.027', 'AMMO3': '0.040', 'WEAPON4': '0.050', 'WEAPON1': '0.070', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon7': '0.118', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'weapon5': '0.278', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.426', 'FRAGCOUNT': '1.000', 'weapon3': '1.152', 'weapon2': '1.732'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:17,432][63732] Updated weights for policy 0, policy_version 2330 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:17,458][109198] Fps is (10 sec: 11059.2, 60 sec: 10990.9, 300 sec: 11149.5). Total num frames: 19951616. Throughput: 0: 1344.1, 1: 1391.6. Samples: 4977983. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:17,459][109198] Avg episode reward: [(0, '-1.289'), (1, '-1.248')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:19,190][63805] DAMAGECOUNT value on done: 16181.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:19,190][63805] Sum rewards: -1.101, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.120', 'AMMO2': '0.001', 'AMMO4': '0.006', 'AMMO5': '0.006', 'ARMOR': '0.016', 'weapon7': '0.052', 'weapon5': '0.058', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.150', 'AMMO3': '0.156', 'HITCOUNT': '0.300', 'WEAPON3': '0.900', 'weapon2': '1.406', 'DAMAGECOUNT': '1.530', 'weapon3': '2.138', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:19,635][63805] DAMAGECOUNT value on done: 14204.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:20,709][63735] DAMAGECOUNT value on done: 13679.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:20,709][63735] Sum rewards: -0.019, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.270', 'AMMO4': '-0.046', 'AMMO2': '-0.009', 'AMMO5': '0.014', 'ARMOR': '0.040', 'weapon7': '0.052', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon5': '0.140', 'AMMO3': '0.148', 'WEAPON7': '0.200', 'weapon4': '0.206', 'HITCOUNT': '0.230', 'WEAPON5': '0.350', 'WEAPON3': '0.950', 'weapon2': '0.996', 'DAMAGECOUNT': '1.272', 'weapon3': '2.118', 'FRAGCOUNT': '3.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:21,109][63735] DAMAGECOUNT value on done: 18359.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:21,110][63735] Sum rewards: 0.028, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.086', 'AMMO2': '0.020', 'AMMO5': '0.025', 'WEAPON1': '0.030', 'weapon4': '0.036', 'weapon5': '0.060', 'ARMOR': '0.078', 'AMMO3': '0.098', 'AMMO4': '0.101', 'WEAPON4': '0.250', 'WEAPON5': '0.400', 'HITCOUNT': '0.410', 'WEAPON3': '0.500', 'weapon3': '1.436', 'DAMAGECOUNT': '1.665', 'weapon2': '2.004', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:22,458][109198] Fps is (10 sec: 11059.5, 60 sec: 10922.7, 300 sec: 11149.4). Total num frames: 20004864. Throughput: 0: 1356.4, 1: 1379.8. Samples: 4994490. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:22,460][109198] Avg episode reward: [(0, '-1.249'), (1, '-1.277')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:23,657][63805] DAMAGECOUNT value on done: 16070.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:23,658][63805] Sum rewards: -0.064, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.280', 'AMMO5': '0.007', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'weapon5': '0.024', 'ARMOR': '0.032', 'AMMO4': '0.088', 'AMMO3': '0.106', 'weapon4': '0.114', 'HITCOUNT': '0.120', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.324', 'WEAPON3': '0.600', 'weapon2': '1.166', 'FRAGCOUNT': '2.000', 'weapon3': '2.046'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:23,705][63733] Updated weights for policy 1, policy_version 2550 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:23,859][63734] DAMAGECOUNT value on done: 14785.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:23,860][63734] Sum rewards: -2.748, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.846', 'AMMO5': '0.009', 'AMMO2': '0.032', 'WEAPON1': '0.050', 'AMMO3': '0.081', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO4': '0.159', 'weapon4': '0.176', 'WEAPON5': '0.200', 'weapon5': '0.208', 'HITCOUNT': '0.260', 'WEAPON4': '0.300', 'WEAPON3': '0.400', 'FRAGCOUNT': '0.500', 'ARMOR': '0.522', 'weapon3': '0.974', 'DAMAGECOUNT': '1.065', 'weapon2': '1.862'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:24,020][63805] DAMAGECOUNT value on done: 17698.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:24,021][63805] Sum rewards: -4.003, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.350', 'ARMOR': '0.008', 'AMMO5': '0.013', 'AMMO2': '0.023', 'weapon7': '0.048', 'WEAPON1': '0.060', 'weapon4': '0.074', 'AMMO3': '0.075', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO4': '0.115', 'weapon5': '0.136', 'HITCOUNT': '0.240', 'WEAPON5': '0.250', 'WEAPON4': '0.250', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.879', 'FRAGCOUNT': '1.000', 'weapon3': '1.482', 'weapon2': '1.594'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:24,213][63806] DAMAGECOUNT value on done: 14727.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:24,214][63806] Sum rewards: -6.119, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.172', 'AMMO5': '0.013', 'weapon5': '0.014', 'AMMO2': '0.023', 'weapon4': '0.032', 'WEAPON1': '0.040', 'ARMOR': '0.101', 'AMMO4': '0.114', 'AMMO3': '0.158', 'HITCOUNT': '0.180', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.507', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.162', 'weapon3': '2.310'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:24,265][63734] DAMAGECOUNT value on done: 14810.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:24,266][63734] Sum rewards: 1.240, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.036', 'AMMO2': '0.005', 'AMMO5': '0.022', 'AMMO4': '0.026', 'ARMOR': '0.036', 'WEAPON1': '0.050', 'WEAPON4': '0.050', 'weapon4': '0.052', 'weapon5': '0.068', 'AMMO3': '0.169', 'HITCOUNT': '0.290', 'WEAPON5': '0.450', 'weapon2': '0.860', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.401', 'weapon3': '2.396', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:24,648][63806] DAMAGECOUNT value on done: 15236.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:24,648][63806] Sum rewards: 0.732, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.166', 'AMMO5': '0.010', 'AMMO2': '0.021', 'WEAPON1': '0.040', 'AMMO4': '0.106', 'AMMO3': '0.140', 'WEAPON5': '0.200', 'HITCOUNT': '0.300', 'weapon5': '0.360', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.119', 'weapon3': '1.372', 'weapon2': '1.730', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:24,887][63732] Updated weights for policy 0, policy_version 2340 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:26,664][63771] DAMAGECOUNT value on done: 15470.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:27,047][63767] DAMAGECOUNT value on done: 17672.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:27,047][63767] Sum rewards: -0.626, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.401', 'AMMO5': '0.010', 'AMMO2': '0.013', 'ARMOR': '0.048', 'AMMO4': '0.065', 'weapon5': '0.116', 'AMMO3': '0.131', 'WEAPON5': '0.150', 'HITCOUNT': '0.290', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.230', 'weapon2': '1.292', 'weapon3': '2.330'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:27,091][63771] DAMAGECOUNT value on done: 12212.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:27,092][63771] Sum rewards: 1.601, reward structure: {'DEATHCOUNT': '-2.250', 'FRAGCOUNT': '-0.500', 'HEALTH': '-0.308', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO2': '0.024', 'weapon7': '0.048', 'weapon5': '0.054', 'HITCOUNT': '0.080', 'AMMO3': '0.088', 'WEAPON5': '0.100', 'AMMO4': '0.120', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'weapon4': '0.204', 'WEAPON3': '0.250', 'DAMAGECOUNT': '0.411', 'ARMOR': '0.471', 'weapon2': '0.502', 'weapon3': '1.640'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:27,461][109198] Fps is (10 sec: 10646.4, 60 sec: 10922.1, 300 sec: 11135.5). Total num frames: 20058112. Throughput: 0: 1362.4, 1: 1367.7. Samples: 5010640. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:27,465][109198] Avg episode reward: [(0, '-1.225'), (1, '-1.418')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:27,469][63767] DAMAGECOUNT value on done: 16827.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:27,470][63767] Sum rewards: 1.357, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.682', 'AMMO5': '0.015', 'AMMO2': '0.022', 'WEAPON1': '0.050', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'weapon7': '0.100', 'AMMO3': '0.104', 'AMMO4': '0.107', 'weapon5': '0.172', 'WEAPON5': '0.200', 'HITCOUNT': '0.220', 'weapon4': '0.220', 'WEAPON4': '0.250', 'ARMOR': '0.424', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.795', 'weapon2': '0.978', 'weapon3': '2.032', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:27,475][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002343_9596928.pth...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:27,475][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000002554_10461184.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:27,535][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000002155_8826880.pth\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:27,539][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002092_8568832.pth\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:30,131][63767] DAMAGECOUNT value on done: 17453.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:30,131][63767] Sum rewards: -1.779, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.929', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'weapon5': '0.038', 'ARMOR': '0.044', 'WEAPON5': '0.050', 'weapon7': '0.050', 'AMMO3': '0.102', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.160', 'WEAPON7': '0.200', 'WEAPON4': '0.250', 'weapon4': '0.382', 'DAMAGECOUNT': '0.573', 'WEAPON3': '0.750', 'weapon2': '0.806', 'FRAGCOUNT': '1.000', 'weapon3': '1.498'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:30,534][63767] DAMAGECOUNT value on done: 19110.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:30,534][63767] Sum rewards: -0.990, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.696', 'AMMO5': '0.017', 'AMMO2': '0.019', 'weapon4': '0.044', 'ARMOR': '0.048', 'WEAPON1': '0.050', 'AMMO4': '0.097', 'AMMO3': '0.115', 'HITCOUNT': '0.180', 'weapon5': '0.194', 'WEAPON4': '0.200', 'WEAPON5': '0.350', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.747', 'weapon3': '1.598', 'weapon2': '1.646', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:31,492][63733] Updated weights for policy 1, policy_version 2560 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:31,887][63770] DAMAGECOUNT value on done: 14456.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:31,888][63770] Sum rewards: -0.462, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO2': '0.027', 'WEAPON4': '0.050', 'ARMOR': '0.088', 'AMMO4': '0.134', 'AMMO3': '0.151', 'weapon4': '0.190', 'HITCOUNT': '0.370', 'HEALTH': '0.622', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.068', 'weapon2': '1.340', 'weapon3': '2.098'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:32,277][63770] DAMAGECOUNT value on done: 15474.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:32,277][63770] Sum rewards: -3.823, reward structure: {'DEATHCOUNT': '-10.500', 'AMMO5': '0.020', 'AMMO2': '0.022', 'weapon4': '0.034', 'ARMOR': '0.040', 'WEAPON1': '0.040', 'weapon5': '0.078', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'AMMO4': '0.109', 'AMMO3': '0.120', 'HEALTH': '0.280', 'DAMAGECOUNT': '0.390', 'WEAPON5': '0.400', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.532', 'weapon3': '1.812'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:32,362][63770] DAMAGECOUNT value on done: 16704.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:32,362][63770] Sum rewards: -0.902, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.808', 'ARMOR': '0.008', 'AMMO5': '0.022', 'AMMO2': '0.031', 'WEAPON1': '0.050', 'weapon4': '0.058', 'AMMO3': '0.115', 'AMMO4': '0.155', 'HITCOUNT': '0.200', 'weapon5': '0.224', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.900', 'weapon2': '1.272', 'weapon3': '1.820', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:32,458][109198] Fps is (10 sec: 10649.7, 60 sec: 10922.7, 300 sec: 11121.7). Total num frames: 20111360. Throughput: 0: 1362.4, 1: 1368.8. Samples: 5018660. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:32,460][109198] Avg episode reward: [(0, '-1.228'), (1, '-1.423')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:32,590][63732] Updated weights for policy 0, policy_version 2350 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:32,749][63770] DAMAGECOUNT value on done: 15249.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:32,749][63770] Sum rewards: 1.532, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.478', 'AMMO2': '0.008', 'weapon4': '0.010', 'AMMO5': '0.014', 'weapon5': '0.034', 'AMMO4': '0.039', 'WEAPON4': '0.050', 'WEAPON1': '0.060', 'AMMO3': '0.122', 'HITCOUNT': '0.300', 'WEAPON5': '0.300', 'ARMOR': '0.432', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.500', 'weapon2': '1.550', 'DAMAGECOUNT': '1.665', 'weapon3': '1.976'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:32,931][63769] DAMAGECOUNT value on done: 15695.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:33,327][63769] DAMAGECOUNT value on done: 13948.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:33,328][63769] Sum rewards: -6.397, reward structure: {'DEATHCOUNT': '-10.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.152', 'ARMOR': '0.008', 'AMMO2': '0.013', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.067', 'weapon5': '0.112', 'HITCOUNT': '0.180', 'AMMO3': '0.191', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.747', 'weapon2': '1.588', 'weapon3': '1.914'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:33,813][63771] DAMAGECOUNT value on done: 13702.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:33,814][63771] Sum rewards: 1.159, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.454', 'AMMO5': '0.010', 'AMMO2': '0.011', 'WEAPON1': '0.030', 'AMMO4': '0.055', 'weapon7': '0.076', 'AMMO3': '0.097', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'weapon4': '0.220', 'HITCOUNT': '0.240', 'ARMOR': '0.620', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.038', 'weapon2': '1.400', 'weapon3': '1.826', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:34,069][63734] DAMAGECOUNT value on done: 17425.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:34,069][63734] Sum rewards: 1.694, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.170', 'AMMO5': '0.005', 'AMMO2': '0.009', 'AMMO4': '0.046', 'AMMO3': '0.118', 'HITCOUNT': '0.120', 'WEAPON5': '0.150', 'weapon5': '0.168', 'ARMOR': '0.416', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.762', 'weapon2': '1.272', 'weapon3': '1.548', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:34,193][63771] DAMAGECOUNT value on done: 16958.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:34,194][63771] Sum rewards: -1.688, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.017', 'AMMO2': '0.016', 'weapon4': '0.016', 'AMMO5': '0.028', 'ARMOR': '0.040', 'weapon5': '0.074', 'AMMO4': '0.078', 'WEAPON1': '0.090', 'AMMO3': '0.102', 'WEAPON4': '0.150', 'HITCOUNT': '0.180', 'WEAPON5': '0.550', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.726', 'FRAGCOUNT': '1.000', 'weapon2': '1.320', 'weapon3': '1.810'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:34,475][63734] DAMAGECOUNT value on done: 15463.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:34,573][63770] Large shaping reward 2.614 for [('FRAGCOUNT', 2.0, 2.0), ('HITCOUNT', 0.03, 3.0), ('DAMAGECOUNT', 0.582, 194.0), ('weapon7', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:35,610][63769] DAMAGECOUNT value on done: 18427.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:35,610][63769] Sum rewards: -1.440, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.668', 'AMMO2': '0.009', 'AMMO5': '0.024', 'WEAPON1': '0.030', 'AMMO4': '0.047', 'WEAPON4': '0.050', 'weapon5': '0.060', 'weapon7': '0.070', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'ARMOR': '0.104', 'HITCOUNT': '0.130', 'AMMO3': '0.137', 'weapon4': '0.202', 'WEAPON5': '0.500', 'DAMAGECOUNT': '0.549', 'WEAPON3': '0.750', 'weapon2': '0.972', 'weapon3': '1.544', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:36,019][63769] DAMAGECOUNT value on done: 12486.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:36,019][63769] Sum rewards: -2.940, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.348', 'weapon4': '0.006', 'AMMO5': '0.013', 'AMMO2': '0.034', 'weapon5': '0.058', 'WEAPON1': '0.080', 'AMMO3': '0.106', 'HITCOUNT': '0.140', 'AMMO4': '0.167', 'WEAPON5': '0.250', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.498', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.570', 'weapon3': '1.786'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:36,490][63735] DAMAGECOUNT value on done: 15522.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:36,490][63735] Sum rewards: -3.746, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.560', 'weapon4': '0.002', 'AMMO2': '0.015', 'AMMO5': '0.025', 'AMMO4': '0.076', 'WEAPON1': '0.080', 'HITCOUNT': '0.120', 'AMMO3': '0.143', 'WEAPON4': '0.200', 'weapon5': '0.314', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.507', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.378', 'weapon3': '1.404'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:36,883][63735] DAMAGECOUNT value on done: 13097.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:36,883][63735] Sum rewards: -4.025, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.143', 'AMMO2': '0.006', 'AMMO5': '0.012', 'weapon7': '0.016', 'AMMO4': '0.030', 'ARMOR': '0.044', 'WEAPON4': '0.050', 'WEAPON1': '0.050', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.118', 'weapon4': '0.134', 'HITCOUNT': '0.180', 'weapon5': '0.248', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.642', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.016', 'weapon3': '2.022'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:37,458][109198] Fps is (10 sec: 11062.5, 60 sec: 10922.7, 300 sec: 11135.6). Total num frames: 20168704. Throughput: 0: 1361.1, 1: 1370.5. Samples: 5034943. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:37,460][109198] Avg episode reward: [(0, '-1.387'), (1, '-1.419')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:38,913][63733] Updated weights for policy 1, policy_version 2570 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:40,126][63732] Updated weights for policy 0, policy_version 2360 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:41,007][63806] DAMAGECOUNT value on done: 14431.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:41,008][63806] Sum rewards: 2.199, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.406', 'weapon4': '0.012', 'AMMO5': '0.012', 'AMMO2': '0.021', 'ARMOR': '0.036', 'WEAPON1': '0.070', 'WEAPON4': '0.100', 'AMMO4': '0.103', 'AMMO3': '0.130', 'HITCOUNT': '0.210', 'weapon5': '0.266', 'WEAPON5': '0.300', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.257', 'weapon3': '1.474', 'weapon2': '1.614', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:41,426][63806] DAMAGECOUNT value on done: 15694.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:41,427][63806] Sum rewards: 0.776, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.754', 'AMMO2': '0.004', 'AMMO5': '0.007', 'weapon5': '0.018', 'WEAPON1': '0.020', 'AMMO4': '0.022', 'ARMOR': '0.044', 'AMMO3': '0.119', 'WEAPON5': '0.150', 'HITCOUNT': '0.350', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.257', 'weapon2': '1.440', 'weapon3': '1.848', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:42,458][109198] Fps is (10 sec: 11059.2, 60 sec: 10922.7, 300 sec: 11121.7). Total num frames: 20221952. Throughput: 0: 1360.5, 1: 1368.8. Samples: 5051346. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:42,459][109198] Avg episode reward: [(0, '-1.358'), (1, '-1.375')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:44,518][63805] DAMAGECOUNT value on done: 16446.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:44,518][63805] Sum rewards: 1.940, reward structure: {'DEATHCOUNT': '-5.250', 'AMMO5': '0.003', 'AMMO2': '0.007', 'WEAPON1': '0.010', 'AMMO4': '0.034', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO3': '0.091', 'weapon4': '0.100', 'HEALTH': '0.104', 'weapon5': '0.168', 'HITCOUNT': '0.260', 'WEAPON3': '0.450', 'ARMOR': '0.452', 'DAMAGECOUNT': '0.795', 'weapon3': '1.140', 'weapon2': '1.476', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:44,986][63805] DAMAGECOUNT value on done: 14330.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:45,908][63735] DAMAGECOUNT value on done: 13940.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:45,909][63735] Sum rewards: -2.594, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.390', 'AMMO5': '0.015', 'AMMO2': '0.019', 'WEAPON1': '0.030', 'ARMOR': '0.040', 'weapon5': '0.064', 'AMMO4': '0.096', 'weapon4': '0.164', 'AMMO3': '0.178', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'HITCOUNT': '0.280', 'DAMAGECOUNT': '0.783', 'WEAPON3': '1.100', 'weapon2': '1.532', 'weapon3': '1.794', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:46,357][63733] Updated weights for policy 1, policy_version 2580 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:46,358][63735] DAMAGECOUNT value on done: 18504.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:46,359][63735] Sum rewards: -3.299, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.871', 'weapon4': '0.002', 'AMMO5': '0.015', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'ARMOR': '0.064', 'AMMO4': '0.092', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'weapon5': '0.116', 'AMMO3': '0.166', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.800', 'weapon3': '1.512', 'weapon2': '1.572', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:46,664][63806] DAMAGECOUNT value on done: 14995.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:46,665][63806] Sum rewards: -4.164, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.438', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO2': '0.039', 'weapon4': '0.040', 'AMMO3': '0.116', 'AMMO4': '0.195', 'HITCOUNT': '0.230', 'WEAPON5': '0.250', 'WEAPON4': '0.300', 'weapon5': '0.388', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.804', 'FRAGCOUNT': '1.000', 'weapon3': '1.024', 'weapon2': '2.002'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:46,808][63805] DAMAGECOUNT value on done: 16119.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:46,991][63806] DAMAGECOUNT value on done: 15526.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:46,992][63806] Sum rewards: -1.489, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.296', 'AMMO5': '0.018', 'AMMO2': '0.023', 'WEAPON1': '0.060', 'weapon4': '0.060', 'weapon5': '0.084', 'AMMO4': '0.113', 'AMMO3': '0.119', 'WEAPON4': '0.150', 'HITCOUNT': '0.260', 'WEAPON5': '0.350', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.870', 'weapon2': '1.430', 'weapon3': '1.670', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:47,198][63805] DAMAGECOUNT value on done: 18010.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:47,198][63805] Sum rewards: -3.945, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.980', 'AMMO2': '0.006', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.031', 'weapon4': '0.062', 'AMMO3': '0.135', 'WEAPON4': '0.150', 'weapon5': '0.160', 'HITCOUNT': '0.230', 'WEAPON5': '0.250', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.936', 'weapon3': '1.308', 'weapon2': '1.832', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:47,458][109198] Fps is (10 sec: 10649.6, 60 sec: 10854.4, 300 sec: 11107.8). Total num frames: 20275200. Throughput: 0: 1360.5, 1: 1367.5. Samples: 5059479. Policy #0 lag: (min: 0.0, avg: 0.4, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:47,460][109198] Avg episode reward: [(0, '-1.325'), (1, '-1.551')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:47,633][63732] Updated weights for policy 0, policy_version 2370 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:49,678][63734] DAMAGECOUNT value on done: 14977.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:49,678][63734] Sum rewards: 0.710, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.831', 'AMMO5': '0.015', 'AMMO2': '0.027', 'WEAPON1': '0.060', 'weapon4': '0.062', 'WEAPON4': '0.100', 'AMMO3': '0.102', 'AMMO4': '0.133', 'weapon5': '0.160', 'HITCOUNT': '0.170', 'WEAPON5': '0.300', 'ARMOR': '0.474', 'DAMAGECOUNT': '0.576', 'WEAPON3': '0.650', 'weapon2': '1.406', 'weapon3': '1.556', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:50,006][63767] DAMAGECOUNT value on done: 17924.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:50,007][63767] Sum rewards: -1.667, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.320', 'AMMO2': '0.002', 'AMMO4': '0.010', 'AMMO5': '0.020', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'weapon4': '0.046', 'weapon7': '0.086', 'WEAPON4': '0.100', 'AMMO3': '0.120', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.140', 'WEAPON7': '0.200', 'WEAPON5': '0.350', 'weapon5': '0.444', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.756', 'weapon2': '1.272', 'weapon3': '1.372'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:50,076][63734] DAMAGECOUNT value on done: 15062.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:50,076][63734] Sum rewards: -3.423, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.494', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.014', 'ARMOR': '0.048', 'weapon5': '0.066', 'AMMO4': '0.068', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.118', 'AMMO3': '0.136', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.756', 'weapon3': '1.614', 'weapon2': '1.746', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:50,332][63767] DAMAGECOUNT value on done: 17117.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:50,332][63767] Sum rewards: -2.233, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.006', 'AMMO2': '0.010', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.050', 'weapon5': '0.076', 'WEAPON4': '0.100', 'weapon4': '0.130', 'AMMO3': '0.136', 'AMMO6': '0.220', 'AMMO7': '0.220', 'weapon7': '0.220', 'HITCOUNT': '0.240', 'WEAPON5': '0.250', 'WEAPON7': '0.300', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.870', 'FRAGCOUNT': '1.000', 'weapon3': '1.522', 'weapon2': '1.644'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:52,378][63771] DAMAGECOUNT value on done: 15710.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:52,378][63771] Sum rewards: 0.478, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.007', 'weapon4': '0.008', 'AMMO2': '0.022', 'WEAPON1': '0.030', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'AMMO4': '0.109', 'AMMO3': '0.126', 'WEAPON5': '0.150', 'weapon5': '0.150', 'HITCOUNT': '0.170', 'HEALTH': '0.296', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.720', 'FRAGCOUNT': '1.000', 'weapon3': '1.064', 'weapon2': '2.094'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:52,458][109198] Fps is (10 sec: 10649.6, 60 sec: 10922.7, 300 sec: 11093.9). Total num frames: 20328448. Throughput: 0: 1358.9, 1: 1364.2. Samples: 5075782. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:52,460][109198] Avg episode reward: [(0, '-1.375'), (1, '-1.575')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:52,782][63771] DAMAGECOUNT value on done: 12397.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:52,782][63771] Sum rewards: -2.187, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.596', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'weapon7': '0.002', 'AMMO5': '0.005', 'WEAPON1': '0.030', 'weapon4': '0.034', 'WEAPON4': '0.050', 'ARMOR': '0.064', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'HITCOUNT': '0.120', 'AMMO3': '0.141', 'WEAPON5': '0.150', 'weapon5': '0.192', 'DAMAGECOUNT': '0.555', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.220', 'weapon3': '2.126'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:53,892][63733] Updated weights for policy 1, policy_version 2590 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:55,170][63732] Updated weights for policy 0, policy_version 2380 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:55,219][63767] DAMAGECOUNT value on done: 17826.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:55,219][63767] Sum rewards: 2.715, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO2': '0.012', 'AMMO5': '0.012', 'ARMOR': '0.024', 'WEAPON1': '0.040', 'WEAPON4': '0.050', 'HEALTH': '0.057', 'AMMO4': '0.059', 'weapon5': '0.080', 'weapon4': '0.120', 'WEAPON5': '0.150', 'AMMO3': '0.166', 'HITCOUNT': '0.250', 'WEAPON3': '0.700', 'weapon2': '0.920', 'DAMAGECOUNT': '1.119', 'weapon3': '1.706', 'FRAGCOUNT': '4.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:55,338][63734] Large shaping reward 2.632 for [('FRAGCOUNT', 2.0, 2.0), ('HITCOUNT', 0.03, 3.0), ('DAMAGECOUNT', 0.6, 200), ('weapon7', 0.002)]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:55,606][63767] DAMAGECOUNT value on done: 19357.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:55,607][63767] Sum rewards: -5.028, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.122', 'AMMO5': '0.016', 'weapon4': '0.018', 'AMMO2': '0.020', 'ARMOR': '0.035', 'weapon5': '0.040', 'WEAPON1': '0.050', 'AMMO4': '0.098', 'WEAPON4': '0.150', 'AMMO3': '0.206', 'HITCOUNT': '0.210', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.741', 'WEAPON3': '1.050', 'weapon2': '1.056', 'FRAGCOUNT': '2.000', 'weapon3': '2.054'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:56,059][63769] DAMAGECOUNT value on done: 15795.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:56,060][63769] Sum rewards: 1.602, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.555', 'weapon4': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'AMMO5': '0.017', 'ARMOR': '0.032', 'AMMO4': '0.056', 'AMMO3': '0.066', 'WEAPON4': '0.100', 'HITCOUNT': '0.120', 'weapon5': '0.204', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.450', 'weapon3': '1.328', 'weapon2': '1.702', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:56,367][63769] DAMAGECOUNT value on done: 13998.0\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:57,458][109198] Fps is (10 sec: 11059.2, 60 sec: 10922.7, 300 sec: 11107.8). Total num frames: 20385792. Throughput: 0: 1358.2, 1: 1363.9. Samples: 5092237. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:06:57,460][109198] Avg episode reward: [(0, '-1.341'), (1, '-1.642')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:57,475][63770] DAMAGECOUNT value on done: 14965.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:57,475][63770] Sum rewards: 0.965, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.996', 'AMMO2': '0.001', 'AMMO4': '0.007', 'AMMO5': '0.010', 'WEAPON1': '0.030', 'weapon7': '0.062', 'ARMOR': '0.072', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.107', 'weapon5': '0.162', 'HITCOUNT': '0.180', 'WEAPON3': '0.650', 'weapon3': '1.358', 'DAMAGECOUNT': '1.527', 'weapon2': '1.894', 'FRAGCOUNT': '6.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:57,896][63770] DAMAGECOUNT value on done: 15698.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:57,983][63770] DAMAGECOUNT value on done: 17225.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:57,984][63770] Sum rewards: 3.121, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.065', 'weapon4': '0.002', 'AMMO5': '0.017', 'AMMO2': '0.023', 'ARMOR': '0.032', 'WEAPON1': '0.080', 'WEAPON4': '0.100', 'AMMO3': '0.112', 'AMMO4': '0.116', 'weapon5': '0.126', 'WEAPON5': '0.350', 'HITCOUNT': '0.410', 'WEAPON3': '0.700', 'weapon2': '1.306', 'DAMAGECOUNT': '1.563', 'weapon3': '1.998', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:58,379][63770] DAMAGECOUNT value on done: 15585.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:58,380][63770] Sum rewards: -4.740, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-0.960', 'AMMO2': '0.012', 'AMMO5': '0.015', 'WEAPON1': '0.030', 'AMMO4': '0.059', 'weapon5': '0.082', 'WEAPON4': '0.100', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'weapon4': '0.166', 'AMMO3': '0.182', 'HITCOUNT': '0.240', 'WEAPON5': '0.300', 'WEAPON3': '1.000', 'DAMAGECOUNT': '1.008', 'weapon2': '1.376', 'FRAGCOUNT': '2.000', 'weapon3': '2.100'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:59,344][63771] DAMAGECOUNT value on done: 13856.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:59,345][63771] Sum rewards: -4.963, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.154', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.010', 'weapon4': '0.026', 'weapon7': '0.048', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon5': '0.144', 'HITCOUNT': '0.180', 'AMMO3': '0.184', 'WEAPON7': '0.200', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.462', 'WEAPON3': '1.100', 'weapon2': '1.708', 'weapon3': '1.794', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:59,610][63734] DAMAGECOUNT value on done: 17770.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:59,610][63734] Sum rewards: -3.648, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.698', 'FRAGCOUNT': '-1.000', 'AMMO2': '0.007', 'AMMO5': '0.028', 'AMMO4': '0.034', 'WEAPON1': '0.040', 'AMMO3': '0.132', 'weapon5': '0.238', 'HITCOUNT': '0.290', 'WEAPON5': '0.450', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.035', 'weapon2': '1.118', 'weapon3': '2.278'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:59,739][63771] DAMAGECOUNT value on done: 17309.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:06:59,740][63771] Sum rewards: -3.519, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.108', 'AMMO2': '0.011', 'AMMO5': '0.012', 'weapon4': '0.024', 'WEAPON1': '0.030', 'ARMOR': '0.032', 'AMMO4': '0.052', 'weapon5': '0.060', 'WEAPON4': '0.100', 'AMMO3': '0.179', 'WEAPON5': '0.250', 'HITCOUNT': '0.280', 'weapon2': '0.928', 'WEAPON3': '0.950', 'DAMAGECOUNT': '1.053', 'weapon3': '2.378', 'FRAGCOUNT': '2.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:00,038][63734] DAMAGECOUNT value on done: 15859.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:00,038][63734] Sum rewards: -1.141, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.736', 'AMMO2': '0.014', 'AMMO5': '0.022', 'WEAPON1': '0.040', 'AMMO4': '0.071', 'AMMO3': '0.147', 'weapon5': '0.260', 'HITCOUNT': '0.340', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.188', 'weapon2': '1.490', 'weapon3': '1.822', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:00,930][63769] DAMAGECOUNT value on done: 18557.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:00,930][63769] Sum rewards: -1.539, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.831', 'AMMO2': '0.001', 'AMMO5': '0.005', 'AMMO4': '0.006', 'ARMOR': '0.032', 'WEAPON1': '0.040', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.136', 'weapon4': '0.194', 'weapon5': '0.224', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.020', 'weapon3': '2.054'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:01,332][63769] DAMAGECOUNT value on done: 12616.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:01,399][63733] Updated weights for policy 1, policy_version 2600 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:01,679][63735] DAMAGECOUNT value on done: 15844.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:01,680][63735] Sum rewards: -1.602, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.764', 'AMMO5': '0.012', 'AMMO2': '0.021', 'WEAPON1': '0.060', 'AMMO4': '0.105', 'AMMO3': '0.113', 'WEAPON5': '0.250', 'HITCOUNT': '0.260', 'weapon5': '0.272', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.966', 'weapon3': '1.424', 'weapon2': '1.878', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:02,134][63735] DAMAGECOUNT value on done: 13383.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:02,135][63735] Sum rewards: -6.650, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.484', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.012', 'AMMO5': '0.015', 'ARMOR': '0.044', 'WEAPON1': '0.050', 'AMMO4': '0.061', 'weapon5': '0.112', 'WEAPON4': '0.150', 'weapon4': '0.220', 'AMMO3': '0.239', 'HITCOUNT': '0.240', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.858', 'weapon2': '0.972', 'WEAPON3': '1.150', 'weapon3': '2.110'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:02,458][109198] Fps is (10 sec: 11059.3, 60 sec: 10922.7, 300 sec: 11093.9). Total num frames: 20439040. Throughput: 0: 1357.4, 1: 1363.4. Samples: 5100417. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:02,460][109198] Avg episode reward: [(0, '-1.516'), (1, '-1.782')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:02,679][63732] Updated weights for policy 0, policy_version 2390 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:05,450][63806] DAMAGECOUNT value on done: 14567.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:05,451][63806] Sum rewards: -1.686, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.218', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'ARMOR': '0.016', 'AMMO2': '0.035', 'AMMO3': '0.091', 'weapon4': '0.112', 'WEAPON5': '0.150', 'weapon5': '0.158', 'HITCOUNT': '0.160', 'AMMO4': '0.173', 'WEAPON4': '0.350', 'DAMAGECOUNT': '0.408', 'WEAPON3': '0.500', 'weapon2': '1.252', 'weapon3': '1.610', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:05,888][63806] DAMAGECOUNT value on done: 15826.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:05,889][63806] Sum rewards: -2.416, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.030', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.012', 'AMMO5': '0.017', 'WEAPON1': '0.060', 'AMMO4': '0.061', 'HITCOUNT': '0.090', 'AMMO3': '0.157', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.396', 'weapon5': '0.398', 'ARMOR': '0.524', 'WEAPON3': '0.800', 'weapon2': '1.012', 'weapon3': '2.086'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:07,458][109198] Fps is (10 sec: 11059.2, 60 sec: 10922.7, 300 sec: 11093.9). Total num frames: 20496384. Throughput: 0: 1358.1, 1: 1365.6. Samples: 5117054. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:07,460][109198] Avg episode reward: [(0, '-1.526'), (1, '-1.785')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:08,778][63733] Updated weights for policy 1, policy_version 2610 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:08,861][63806] DAMAGECOUNT value on done: 15208.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:08,862][63806] Sum rewards: 2.691, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.121', 'AMMO5': '0.003', 'AMMO2': '0.008', 'weapon4': '0.024', 'WEAPON1': '0.030', 'weapon5': '0.030', 'AMMO4': '0.037', 'WEAPON5': '0.050', 'AMMO3': '0.092', 'WEAPON4': '0.100', 'HITCOUNT': '0.200', 'ARMOR': '0.523', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.639', 'weapon2': '1.278', 'weapon3': '1.498', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:09,182][63806] DAMAGECOUNT value on done: 15746.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:09,183][63806] Sum rewards: -5.527, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.305', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.023', 'AMMO2': '-0.005', 'weapon4': '0.010', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'ARMOR': '0.064', 'weapon5': '0.092', 'WEAPON4': '0.100', 'AMMO3': '0.138', 'HITCOUNT': '0.240', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.660', 'WEAPON3': '0.750', 'weapon3': '1.514', 'weapon2': '1.700'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:09,562][63805] DAMAGECOUNT value on done: 16429.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:09,563][63805] Sum rewards: 2.880, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.310', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'AMMO2': '0.024', 'weapon4': '0.026', 'WEAPON4': '0.050', 'AMMO3': '0.067', 'weapon5': '0.094', 'WEAPON5': '0.100', 'AMMO4': '0.118', 'HITCOUNT': '0.210', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.930', 'weapon3': '1.252', 'weapon2': '1.394', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:09,650][63805] DAMAGECOUNT value on done: 16653.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:09,651][63805] Sum rewards: -1.385, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.372', 'AMMO2': '0.003', 'AMMO4': '0.015', 'WEAPON1': '0.020', 'AMMO5': '0.023', 'AMMO3': '0.096', 'WEAPON4': '0.150', 'HITCOUNT': '0.160', 'weapon4': '0.194', 'WEAPON5': '0.400', 'weapon5': '0.456', 'ARMOR': '0.519', 'DAMAGECOUNT': '0.621', 'WEAPON3': '0.650', 'weapon3': '1.456', 'weapon2': '1.474', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:09,940][63805] DAMAGECOUNT value on done: 18433.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:09,941][63805] Sum rewards: 5.488, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.027', 'ARMOR': '0.053', 'AMMO3': '0.060', 'weapon4': '0.098', 'AMMO4': '0.132', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'weapon5': '0.232', 'WEAPON3': '0.250', 'HITCOUNT': '0.260', 'HEALTH': '0.895', 'weapon3': '1.152', 'DAMAGECOUNT': '1.269', 'weapon2': '1.742', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:10,025][63805] DAMAGECOUNT value on done: 14437.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:10,107][63732] Updated weights for policy 0, policy_version 2400 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:11,177][63735] DAMAGECOUNT value on done: 14120.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:11,178][63735] Sum rewards: -3.314, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.580', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'AMMO2': '0.029', 'weapon4': '0.030', 'WEAPON4': '0.050', 'ARMOR': '0.108', 'AMMO4': '0.142', 'AMMO3': '0.163', 'WEAPON5': '0.200', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.540', 'WEAPON3': '0.950', 'weapon2': '1.638', 'weapon3': '1.926', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:11,504][63735] DAMAGECOUNT value on done: 18602.0\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:12,458][109198] Fps is (10 sec: 11059.1, 60 sec: 10922.7, 300 sec: 11080.0). Total num frames: 20549632. Throughput: 0: 1360.1, 1: 1368.2. Samples: 5133404. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:12,460][109198] Avg episode reward: [(0, '-1.570'), (1, '-1.746')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:12,773][63767] DAMAGECOUNT value on done: 18054.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:13,144][63767] DAMAGECOUNT value on done: 17416.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:13,144][63767] Sum rewards: -3.740, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.620', 'AMMO4': '-0.034', 'AMMO2': '-0.007', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'weapon5': '0.046', 'ARMOR': '0.096', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'AMMO3': '0.201', 'weapon4': '0.204', 'HITCOUNT': '0.280', 'DAMAGECOUNT': '0.897', 'WEAPON3': '0.950', 'weapon3': '1.770', 'weapon2': '1.796', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:14,999][63734] DAMAGECOUNT value on done: 15262.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:15,000][63734] Sum rewards: 0.389, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.587', 'AMMO2': '0.013', 'AMMO5': '0.020', 'ARMOR': '0.024', 'weapon4': '0.024', 'weapon5': '0.028', 'AMMO4': '0.063', 'WEAPON1': '0.080', 'AMMO3': '0.083', 'WEAPON4': '0.150', 'HITCOUNT': '0.200', 'WEAPON5': '0.400', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.855', 'weapon2': '1.520', 'weapon3': '1.666', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:15,431][63734] DAMAGECOUNT value on done: 15527.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:15,432][63734] Sum rewards: 1.074, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.070', 'AMMO2': '0.007', 'AMMO5': '0.011', 'AMMO4': '0.033', 'WEAPON1': '0.040', 'ARMOR': '0.060', 'weapon5': '0.074', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.110', 'weapon7': '0.172', 'HITCOUNT': '0.240', 'WEAPON5': '0.250', 'WEAPON3': '0.650', 'weapon2': '1.050', 'DAMAGECOUNT': '1.350', 'weapon3': '2.046', 'FRAGCOUNT': '2.500'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:16,055][63733] Updated weights for policy 1, policy_version 2620 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:17,458][109198] Fps is (10 sec: 11059.2, 60 sec: 10922.7, 300 sec: 11080.0). Total num frames: 20606976. Throughput: 0: 1360.2, 1: 1375.5. Samples: 5141767. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:17,460][109198] Avg episode reward: [(0, '-1.556'), (1, '-1.676')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:17,770][63771] DAMAGECOUNT value on done: 15964.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:17,770][63771] Sum rewards: -0.462, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.958', 'AMMO2': '0.007', 'AMMO5': '0.012', 'AMMO4': '0.035', 'ARMOR': '0.036', 'WEAPON1': '0.050', 'weapon5': '0.054', 'AMMO3': '0.097', 'WEAPON4': '0.100', 'weapon4': '0.118', 'HITCOUNT': '0.180', 'WEAPON5': '0.250', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.762', 'FRAGCOUNT': '1.000', 'weapon2': '1.322', 'weapon3': '1.772'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:17,890][63732] Updated weights for policy 0, policy_version 2410 (0.0010)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:18,230][63771] DAMAGECOUNT value on done: 12586.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:18,231][63771] Sum rewards: 0.189, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.180', 'AMMO4': '-0.003', 'AMMO2': '-0.001', 'AMMO5': '0.012', 'WEAPON1': '0.050', 'weapon7': '0.058', 'AMMO3': '0.060', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'HITCOUNT': '0.110', 'weapon5': '0.168', 'WEAPON5': '0.300', 'WEAPON3': '0.400', 'ARMOR': '0.500', 'DAMAGECOUNT': '0.567', 'weapon3': '1.226', 'weapon2': '1.622', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:19,091][63769] DAMAGECOUNT value on done: 15938.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:19,092][63769] Sum rewards: 0.786, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.470', 'AMMO2': '0.001', 'AMMO4': '0.004', 'weapon7': '0.006', 'AMMO5': '0.009', 'WEAPON1': '0.020', 'weapon4': '0.042', 'HITCOUNT': '0.060', 'WEAPON4': '0.100', 'AMMO3': '0.108', 'WEAPON5': '0.150', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon5': '0.268', 'DAMAGECOUNT': '0.429', 'ARMOR': '0.503', 'WEAPON3': '0.700', 'weapon2': '1.510', 'weapon3': '1.746', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:19,453][63769] DAMAGECOUNT value on done: 14170.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:19,453][63769] Sum rewards: -0.249, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.928', 'AMMO4': '-0.013', 'AMMO2': '-0.003', 'AMMO5': '0.012', 'ARMOR': '0.032', 'WEAPON1': '0.040', 'weapon7': '0.066', 'AMMO3': '0.092', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.130', 'weapon5': '0.142', 'WEAPON7': '0.200', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.516', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.626', 'weapon3': '1.748'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:20,275][63767] DAMAGECOUNT value on done: 18064.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:20,276][63767] Sum rewards: -0.090, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.820', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'AMMO5': '0.020', 'WEAPON1': '0.020', 'WEAPON4': '0.100', 'AMMO3': '0.136', 'HITCOUNT': '0.230', 'weapon5': '0.232', 'WEAPON5': '0.350', 'ARMOR': '0.496', 'DAMAGECOUNT': '0.714', 'WEAPON3': '0.900', 'weapon2': '1.260', 'FRAGCOUNT': '2.000', 'weapon3': '2.030'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:20,679][63767] DAMAGECOUNT value on done: 19457.0\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:22,458][109198] Fps is (10 sec: 11059.3, 60 sec: 10922.7, 300 sec: 11066.1). Total num frames: 20660224. Throughput: 0: 1347.9, 1: 1386.4. Samples: 5157984. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:22,460][109198] Avg episode reward: [(0, '-1.394'), (1, '-1.657')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:22,737][63770] DAMAGECOUNT value on done: 15316.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:22,737][63770] Sum rewards: 0.819, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.197', 'AMMO4': '-0.015', 'AMMO2': '-0.003', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'AMMO3': '0.121', 'WEAPON5': '0.250', 'weapon5': '0.250', 'HITCOUNT': '0.320', 'WEAPON3': '0.550', 'DAMAGECOUNT': '1.053', 'weapon2': '1.140', 'FRAGCOUNT': '2.000', 'weapon3': '2.034'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:23,121][63733] Updated weights for policy 1, policy_version 2630 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:23,169][63770] DAMAGECOUNT value on done: 15938.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:23,170][63770] Sum rewards: -4.391, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.086', 'AMMO5': '0.007', 'AMMO2': '0.012', 'weapon4': '0.014', 'WEAPON1': '0.040', 'AMMO4': '0.058', 'AMMO3': '0.102', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'HITCOUNT': '0.220', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.720', 'FRAGCOUNT': '1.000', 'weapon3': '1.356', 'weapon2': '1.966'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:23,255][63770] DAMAGECOUNT value on done: 17354.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:23,255][63770] Sum rewards: -1.247, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.869', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.031', 'ARMOR': '0.068', 'AMMO3': '0.088', 'weapon4': '0.110', 'HITCOUNT': '0.120', 'weapon5': '0.150', 'AMMO4': '0.154', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.387', 'WEAPON3': '0.400', 'weapon3': '0.716', 'FRAGCOUNT': '2.000', 'weapon2': '2.378'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:23,662][63770] DAMAGECOUNT value on done: 15710.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:24,629][63771] DAMAGECOUNT value on done: 14204.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:24,629][63771] Sum rewards: -6.756, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.674', 'AMMO2': '0.006', 'AMMO5': '0.020', 'AMMO4': '0.029', 'WEAPON1': '0.040', 'weapon5': '0.072', 'AMMO3': '0.185', 'HITCOUNT': '0.190', 'WEAPON4': '0.250', 'weapon4': '0.260', 'WEAPON5': '0.400', 'FRAGCOUNT': '0.500', 'ARMOR': '0.532', 'DAMAGECOUNT': '1.044', 'WEAPON3': '1.050', 'weapon2': '1.564', 'weapon3': '1.776'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:24,994][63771] DAMAGECOUNT value on done: 17464.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:24,994][63771] Sum rewards: -4.421, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.302', 'AMMO5': '0.018', 'AMMO2': '0.023', 'WEAPON1': '0.040', 'weapon5': '0.042', 'weapon4': '0.064', 'ARMOR': '0.104', 'AMMO4': '0.117', 'AMMO3': '0.130', 'HITCOUNT': '0.140', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.388', 'weapon2': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:25,084][63734] DAMAGECOUNT value on done: 18131.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:25,085][63734] Sum rewards: -0.200, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.500', 'AMMO4': '-0.004', 'AMMO2': '-0.001', 'ARMOR': '0.012', 'AMMO5': '0.024', 'weapon4': '0.024', 'WEAPON4': '0.050', 'WEAPON1': '0.060', 'AMMO3': '0.143', 'HITCOUNT': '0.250', 'WEAPON5': '0.400', 'weapon5': '0.522', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.083', 'weapon2': '1.448', 'FRAGCOUNT': '1.500', 'weapon3': '1.738'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:25,502][63734] DAMAGECOUNT value on done: 16118.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:25,502][63734] Sum rewards: -3.107, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.340', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'AMMO5': '0.020', 'AMMO4': '0.022', 'weapon5': '0.026', 'AMMO3': '0.138', 'HITCOUNT': '0.230', 'WEAPON5': '0.350', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.777', 'FRAGCOUNT': '1.000', 'weapon2': '1.220', 'weapon3': '1.936'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:25,960][63732] Updated weights for policy 0, policy_version 2420 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:26,120][63769] DAMAGECOUNT value on done: 18652.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:26,121][63769] Sum rewards: -1.849, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'AMMO2': '0.021', 'ARMOR': '0.033', 'weapon5': '0.068', 'AMMO3': '0.099', 'WEAPON5': '0.100', 'AMMO4': '0.104', 'HITCOUNT': '0.110', 'WEAPON4': '0.200', 'weapon4': '0.260', 'DAMAGECOUNT': '0.285', 'HEALTH': '0.446', 'WEAPON3': '0.550', 'weapon2': '1.252', 'weapon3': '1.848'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:26,432][63769] DAMAGECOUNT value on done: 13056.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:26,432][63769] Sum rewards: 3.133, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-1.430', 'AMMO5': '0.005', 'AMMO2': '0.010', 'WEAPON1': '0.020', 'AMMO4': '0.052', 'ARMOR': '0.064', 'AMMO3': '0.088', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.170', 'weapon4': '0.212', 'HITCOUNT': '0.290', 'WEAPON3': '0.650', 'weapon2': '1.198', 'DAMAGECOUNT': '1.320', 'weapon3': '1.784', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:26,438][63735] DAMAGECOUNT value on done: 15994.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:26,439][63735] Sum rewards: 0.842, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.059', 'weapon4': '0.004', 'AMMO5': '0.007', 'AMMO2': '0.038', 'WEAPON1': '0.040', 'AMMO3': '0.068', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'AMMO4': '0.191', 'WEAPON3': '0.400', 'weapon5': '0.414', 'DAMAGECOUNT': '0.450', 'weapon3': '0.914', 'FRAGCOUNT': '2.000', 'weapon2': '2.034'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:26,885][63735] DAMAGECOUNT value on done: 13583.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:26,886][63735] Sum rewards: 1.643, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO5': '0.007', 'AMMO2': '0.021', 'WEAPON1': '0.030', 'HEALTH': '0.048', 'WEAPON4': '0.050', 'weapon5': '0.078', 'AMMO4': '0.105', 'AMMO3': '0.107', 'ARMOR': '0.128', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'weapon4': '0.204', 'DAMAGECOUNT': '0.600', 'WEAPON3': '0.700', 'weapon2': '1.114', 'weapon3': '1.910', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:27,458][109198] Fps is (10 sec: 10649.6, 60 sec: 10923.2, 300 sec: 11080.0). Total num frames: 20713472. Throughput: 0: 1336.9, 1: 1400.3. Samples: 5174520. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:27,459][109198] Avg episode reward: [(0, '-1.254'), (1, '-1.732')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:29,728][63806] DAMAGECOUNT value on done: 14719.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:30,061][63733] Updated weights for policy 1, policy_version 2640 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:30,144][63806] DAMAGECOUNT value on done: 16126.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:30,144][63806] Sum rewards: -3.499, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.052', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'AMMO5': '0.026', 'weapon4': '0.078', 'AMMO4': '0.089', 'WEAPON4': '0.100', 'AMMO3': '0.239', 'HITCOUNT': '0.240', 'weapon5': '0.246', 'ARMOR': '0.400', 'WEAPON5': '0.450', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.900', 'weapon2': '1.468', 'weapon3': '1.880', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:31,199][63806] DAMAGECOUNT value on done: 15338.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:31,200][63806] Sum rewards: -3.353, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.213', 'AMMO5': '0.015', 'AMMO2': '0.017', 'ARMOR': '0.032', 'weapon5': '0.036', 'WEAPON1': '0.050', 'AMMO4': '0.087', 'HITCOUNT': '0.090', 'weapon4': '0.094', 'WEAPON4': '0.100', 'AMMO3': '0.119', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.478', 'weapon2': '1.552'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:31,562][63806] DAMAGECOUNT value on done: 15891.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:31,562][63806] Sum rewards: -4.220, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.594', 'AMMO5': '0.005', 'AMMO2': '0.010', 'weapon5': '0.040', 'ARMOR': '0.048', 'AMMO4': '0.050', 'WEAPON1': '0.060', 'WEAPON5': '0.100', 'AMMO3': '0.109', 'HITCOUNT': '0.140', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.622', 'weapon3': '1.804'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:32,458][109198] Fps is (10 sec: 11059.2, 60 sec: 10990.9, 300 sec: 11066.1). Total num frames: 20770816. Throughput: 0: 1331.4, 1: 1407.8. Samples: 5182742. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:32,460][109198] Avg episode reward: [(0, '-1.261'), (1, '-1.773')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:32,586][63805] DAMAGECOUNT value on done: 16464.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:32,991][63805] DAMAGECOUNT value on done: 18483.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:33,981][63732] Updated weights for policy 0, policy_version 2430 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:34,610][63805] DAMAGECOUNT value on done: 17163.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:34,610][63805] Sum rewards: -6.579, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-3.050', 'AMMO4': '-0.036', 'AMMO2': '-0.007', 'AMMO5': '0.031', 'WEAPON4': '0.050', 'weapon5': '0.060', 'weapon4': '0.200', 'AMMO3': '0.237', 'HITCOUNT': '0.250', 'ARMOR': '0.435', 'WEAPON5': '0.500', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.500', 'DAMAGECOUNT': '1.530', 'weapon3': '1.718', 'weapon2': '1.754'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:35,066][63805] DAMAGECOUNT value on done: 14572.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:35,066][63805] Sum rewards: -5.482, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.746', 'ARMOR': '0.004', 'AMMO5': '0.015', 'AMMO2': '0.018', 'weapon5': '0.026', 'WEAPON1': '0.050', 'weapon4': '0.074', 'AMMO4': '0.089', 'WEAPON4': '0.100', 'AMMO3': '0.119', 'HITCOUNT': '0.150', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.850', 'weapon3': '1.520', 'weapon2': '1.794', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:35,936][63735] DAMAGECOUNT value on done: 14325.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:35,937][63735] Sum rewards: -2.534, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.985', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'weapon7': '0.090', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon4': '0.122', 'AMMO3': '0.156', 'HITCOUNT': '0.180', 'WEAPON7': '0.200', 'weapon5': '0.214', 'WEAPON5': '0.350', 'ARMOR': '0.460', 'DAMAGECOUNT': '0.615', 'WEAPON3': '1.050', 'weapon2': '1.092', 'FRAGCOUNT': '1.500', 'weapon3': '2.046'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:36,274][63735] DAMAGECOUNT value on done: 18917.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:36,275][63735] Sum rewards: -1.159, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO2': '0.008', 'AMMO5': '0.010', 'ARMOR': '0.028', 'WEAPON1': '0.030', 'AMMO4': '0.039', 'WEAPON4': '0.050', 'weapon5': '0.096', 'AMMO3': '0.119', 'WEAPON5': '0.200', 'HITCOUNT': '0.240', 'HEALTH': '0.462', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.945', 'FRAGCOUNT': '1.000', 'weapon2': '1.612', 'weapon3': '1.752'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:37,191][63733] Updated weights for policy 1, policy_version 2650 (0.0011)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:37,458][109198] Fps is (10 sec: 11059.1, 60 sec: 10922.6, 300 sec: 11066.1). Total num frames: 20824064. Throughput: 0: 1319.1, 1: 1419.0. Samples: 5198998. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:37,460][109198] Avg episode reward: [(0, '-1.259'), (1, '-1.928')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:37,801][63767] DAMAGECOUNT value on done: 18286.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:37,802][63767] Sum rewards: -3.925, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.669', 'AMMO4': '-0.053', 'AMMO2': '-0.010', 'AMMO5': '0.007', 'weapon5': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'WEAPON5': '0.150', 'AMMO3': '0.184', 'HITCOUNT': '0.230', 'DAMAGECOUNT': '0.696', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.246', 'weapon3': '2.274'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:38,260][63767] DAMAGECOUNT value on done: 17581.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:38,260][63767] Sum rewards: -0.654, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.852', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.005', 'WEAPON1': '0.030', 'weapon5': '0.032', 'ARMOR': '0.083', 'AMMO3': '0.084', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'HITCOUNT': '0.170', 'weapon4': '0.170', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.600', 'weapon2': '1.274', 'weapon3': '1.810', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:40,390][63734] DAMAGECOUNT value on done: 15466.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:40,391][63734] Sum rewards: -4.446, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.578', 'weapon5': '0.008', 'AMMO5': '0.010', 'weapon4': '0.012', 'AMMO2': '0.028', 'WEAPON1': '0.040', 'ARMOR': '0.044', 'AMMO4': '0.140', 'AMMO3': '0.176', 'WEAPON5': '0.200', 'HITCOUNT': '0.200', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.612', 'WEAPON3': '1.000', 'weapon2': '1.508', 'weapon3': '1.904', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:40,849][63734] DAMAGECOUNT value on done: 15926.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:40,849][63734] Sum rewards: 1.286, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.128', 'AMMO2': '0.007', 'AMMO5': '0.013', 'weapon5': '0.014', 'AMMO4': '0.036', 'weapon7': '0.050', 'AMMO3': '0.129', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.250', 'WEAPON4': '0.350', 'HITCOUNT': '0.370', 'ARMOR': '0.488', 'weapon4': '0.514', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.197', 'weapon3': '1.464', 'weapon2': '1.582', 'FRAGCOUNT': '2.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:42,175][63732] Updated weights for policy 0, policy_version 2440 (0.0011)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:42,286][63769] DAMAGECOUNT value on done: 16207.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:42,286][63769] Sum rewards: -2.318, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.885', 'WEAPON1': '0.020', 'ARMOR': '0.020', 'weapon4': '0.024', 'AMMO2': '0.024', 'AMMO5': '0.026', 'weapon7': '0.082', 'WEAPON4': '0.100', 'AMMO4': '0.120', 'AMMO3': '0.171', 'weapon5': '0.190', 'HITCOUNT': '0.240', 'AMMO6': '0.260', 'AMMO7': '0.260', 'WEAPON7': '0.300', 'WEAPON5': '0.500', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.807', 'FRAGCOUNT': '1.000', 'weapon2': '1.196', 'weapon3': '2.228'}\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:42,458][109198] Fps is (10 sec: 10649.5, 60 sec: 10922.7, 300 sec: 11052.3). Total num frames: 20877312. Throughput: 0: 1304.8, 1: 1426.6. Samples: 5215150. Policy #0 lag: (min: 0.0, avg: 0.3, max: 1.0)\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:42,460][109198] Avg episode reward: [(0, '-1.225'), (1, '-1.963')]\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:42,627][63769] DAMAGECOUNT value on done: 14653.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:42,628][63769] Sum rewards: 3.675, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.690', 'AMMO5': '0.010', 'AMMO2': '0.023', 'WEAPON1': '0.050', 'weapon4': '0.054', 'WEAPON4': '0.100', 'AMMO4': '0.115', 'AMMO3': '0.120', 'weapon5': '0.148', 'HITCOUNT': '0.300', 'WEAPON5': '0.300', 'ARMOR': '0.506', 'WEAPON3': '0.800', 'weapon2': '1.436', 'DAMAGECOUNT': '1.449', 'weapon3': '1.704', 'FRAGCOUNT': '5.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:43,112][63771] DAMAGECOUNT value on done: 16043.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:43,470][63771] DAMAGECOUNT value on done: 12806.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:43,470][63771] Sum rewards: 0.012, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.910', 'AMMO2': '0.005', 'WEAPON1': '0.020', 'AMMO5': '0.023', 'AMMO4': '0.026', 'ARMOR': '0.052', 'weapon7': '0.052', 'weapon5': '0.098', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.138', 'HITCOUNT': '0.190', 'WEAPON7': '0.200', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.660', 'WEAPON3': '0.850', 'weapon2': '1.194', 'weapon3': '2.074', 'FRAGCOUNT': '3.000'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:44,232][63733] Updated weights for policy 1, policy_version 2660 (0.0012)\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:44,233][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000002660_10895360.pth...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:44,233][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002442_10002432.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,239][63454] Stopping Batcher_0...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,241][109198] Component Batcher_0 stopped!\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,246][109198] Component Batcher_1 stopped!\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,246][63576] Stopping Batcher_1...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,254][63732] Weights refcount: 2 0\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,256][109198] Component InferenceWorker_p0-w0 stopped!\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,255][63732] Stopping InferenceWorker_p0-w0...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,256][63732] Loop inference_proc0-0_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,256][63733] Weights refcount: 2 0\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,258][109198] Component InferenceWorker_p1-w0 stopped!\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,257][63733] Stopping InferenceWorker_p1-w0...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,258][63733] Loop inference_proc1-0_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,260][63454] Loop batcher_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,270][63576] Loop batcher_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,294][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002201_9015296.pth\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:44,302][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002442_10002432.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,302][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000002376_9732096.pth\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:44,311][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000002660_10895360.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,313][109198] Component RolloutWorker_w5 stopped!\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,313][63771] Stopping RolloutWorker_w5...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,313][63771] Loop rollout_proc5_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,316][109198] Component RolloutWorker_w6 stopped!\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,316][63805] Stopping RolloutWorker_w6...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,316][63805] Loop rollout_proc6_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,316][63770] Stopping RolloutWorker_w4...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,317][63769] Stopping RolloutWorker_w3...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,317][63770] Loop rollout_proc4_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,317][63769] Loop rollout_proc3_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,318][109198] Component RolloutWorker_w4 stopped!\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,318][63734] Stopping RolloutWorker_w1...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,319][109198] Component RolloutWorker_w3 stopped!\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,319][63735] Stopping RolloutWorker_w0...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,321][109198] Component RolloutWorker_w1 stopped!\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,320][63734] Loop rollout_proc1_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,321][63767] Stopping RolloutWorker_w2...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,321][63806] Stopping RolloutWorker_w7...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,323][109198] Component RolloutWorker_w0 stopped!\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,324][109198] Component RolloutWorker_w2 stopped!\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,325][109198] Component RolloutWorker_w7 stopped!\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,323][63735] Loop rollout_proc0_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,323][63806] Loop rollout_proc7_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,323][63767] Loop rollout_proc2_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,392][109198] Component LearnerWorker_p0 stopped!\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,392][63454] Stopping LearnerWorker_p0...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,392][63454] Loop learner_proc0_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,403][109198] Component LearnerWorker_p1 stopped!\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,403][63576] Stopping LearnerWorker_p1...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,403][63576] Loop learner_proc1_evt_loop terminating...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:44,405][109198] Waiting for process learner_proc0 to stop...\u001b[0m\n", + "[W CudaIPCTypes.cpp:15] Producer process has been terminated before all shared CUDA tensors released. See Note [Sharing CUDA tensors]\n", + "[W CudaIPCTypes.cpp:15] Producer process has been terminated before all shared CUDA tensors released. See Note [Sharing CUDA tensors]\n", + "\u001b[36m[2023-09-14 15:07:45,204][109198] Waiting for process learner_proc1 to stop...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:45,238][109198] Waiting for process inference_proc0-0 to join...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:45,241][109198] Waiting for process inference_proc1-0 to join...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:45,243][109198] Waiting for process rollout_proc0 to join...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:45,245][109198] Waiting for process rollout_proc1 to join...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:45,247][109198] Waiting for process rollout_proc2 to join...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:45,249][109198] Waiting for process rollout_proc3 to join...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:45,251][109198] Waiting for process rollout_proc4 to join...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:45,254][109198] Waiting for process rollout_proc5 to join...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:45,256][109198] Waiting for process rollout_proc6 to join...\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:45,257][109198] Waiting for process rollout_proc7 to join...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:45,259][109198] Batcher 0 profile tree view:\n", + "batching: 64.5557, releasing_batches: 0.0680\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:45,260][109198] Batcher 1 profile tree view:\n", + "batching: 68.7785, releasing_batches: 0.0768\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:45,260][109198] InferenceWorker_p0-w0 profile tree view:\n", + "wait_policy: 0.0000\n", + " wait_policy_total: 30.4046\n", + "update_model: 14.8111\n", + " weight_update: 0.0012\n", + "one_step: 0.0035\n", + " handle_policy_step: 1755.1900\n", + " deserialize: 33.0362, stack: 6.5566, obs_to_device_normalize: 298.8561, forward: 1199.1000, send_messages: 52.4071\n", + " prepare_outputs: 113.7009\n", + " to_cpu: 62.3233\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:45,261][109198] InferenceWorker_p1-w0 profile tree view:\n", + "wait_policy: 0.0000\n", + " wait_policy_total: 25.0696\n", + "update_model: 14.1502\n", + " weight_update: 0.0012\n", + "one_step: 0.0037\n", + " handle_policy_step: 1761.3411\n", + " deserialize: 34.0947, stack: 6.4026, obs_to_device_normalize: 298.8298, forward: 1203.9989, send_messages: 54.2243\n", + " prepare_outputs: 113.1277\n", + " to_cpu: 61.8986\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:45,262][109198] Learner 0 profile tree view:\n", + "misc: 0.0111, prepare_batch: 32.0013\n", + "train: 137.3761\n", + " epoch_init: 0.0139, minibatch_init: 0.0137, losses_postprocess: 0.6089, kl_divergence: 1.7872, after_optimizer: 5.5057\n", + " calculate_losses: 37.0193\n", + " losses_init: 0.0076, forward_head: 1.8452, bptt_initial: 25.4128, tail: 2.4893, advantages_returns: 0.3729, losses: 4.2074\n", + " bptt: 2.3208\n", + " bptt_forward_core: 2.2331\n", + " update: 91.4740\n", + " clip: 71.3774\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:45,263][109198] Learner 1 profile tree view:\n", + "misc: 0.0145, prepare_batch: 34.6237\n", + "train: 145.7544\n", + " epoch_init: 0.0133, minibatch_init: 0.0146, losses_postprocess: 0.6706, kl_divergence: 1.9250, after_optimizer: 5.8193\n", + " calculate_losses: 40.0468\n", + " losses_init: 0.0077, forward_head: 2.0145, bptt_initial: 27.4411, tail: 2.6716, advantages_returns: 0.4205, losses: 4.6095\n", + " bptt: 2.4854\n", + " bptt_forward_core: 2.3893\n", + " update: 96.2356\n", + " clip: 74.1991\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:45,264][109198] RolloutWorker_w0 profile tree view:\n", + "wait_for_trajectories: 0.8971, enqueue_policy_requests: 47.9106, complete_rollouts: 1.7627, env_step: 1211.2031, overhead: 30.8770\n", + "save_policy_outputs: 52.9181\n", + " split_output_tensors: 18.5308\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:45,265][109198] RolloutWorker_w7 profile tree view:\n", + "wait_for_trajectories: 0.8981, enqueue_policy_requests: 47.0892, complete_rollouts: 1.6376, env_step: 1224.4394, overhead: 31.0357\n", + "save_policy_outputs: 53.1775\n", + " split_output_tensors: 18.7362\u001b[0m\n", + "\u001b[36m[2023-09-14 15:07:45,266][109198] Loop Runner_EvtLoop terminating...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:45,266][109198] Runner profile tree view:\n", + "main_loop: 1875.4927\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 15:07:45,267][109198] Collected {0: 10002432, 1: 10895360}, FPS: 11142.6\u001b[0m\n" + ] + } + ], + "source": [ + "\n", + "## Start the training, this should take around 15 minutes\n", + "register_vizdoom_components()\n", + "\n", + "# The scenario we train on today is health gathering\n", + "# other scenarios include \"doom_basic\", \"doom_two_colors_easy\", \"doom_dm\", \"doom_dwango5\", \"doom_my_way_home\", \"doom_deadly_corridor\", \"doom_defend_the_center\", \"doom_defend_the_line\", \"predict_position\", \"take_cover\"\n", + "env = \"doom_deathmatch_bots\"\n", + "cfg = parse_vizdoom_cfg(\n", + " argv=[f\"--env={env}\", \"--num_workers=8\", \"--num_envs_per_worker=4\", \"--train_for_env_steps=100000000\"]\n", + ")\n", + "\n", + "status = run_rl(cfg)" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": {}, + "outputs": [ + { + "name": "stderr", + "output_type": "stream", + "text": [ + "\u001b[33m[2023-09-14 12:03:16,383][97397] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,385][97397] Overriding arg 'num_workers' with value 1 passed from command line\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,386][97397] Adding new argument 'no_render'=True that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,386][97397] Adding new argument 'save_video'=True that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,387][97397] Adding new argument 'video_frames'=1000000000.0 that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,387][97397] Adding new argument 'video_name'=None that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,388][97397] Adding new argument 'max_num_frames'=1000000000.0 that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,389][97397] Adding new argument 'max_num_episodes'=10 that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,389][97397] Adding new argument 'push_to_hub'=False that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,390][97397] Adding new argument 'hf_repository'=None that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,391][97397] Adding new argument 'policy_index'=0 that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,392][97397] Adding new argument 'eval_deterministic'=False that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,392][97397] Adding new argument 'train_script'=None that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,393][97397] Adding new argument 'enjoy_script'=None that is not in the saved config file!\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,394][97397] Using frameskip 1 and render_action_repeat=4 for evaluation\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,397][97397] Multi agent env, num agents: 2\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,424][97397] Doom resolution: 160x120, resize resolution: (128, 72)\u001b[0m\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.num_agents to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.num_agents` for environment variables or `env.get_wrapper_attr('num_agents')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.is_multiagent to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.is_multiagent` for environment variables or `env.get_wrapper_attr('is_multiagent')` that will search the reminding wrappers.\u001b[0m\n", + " logger.warn(\n", + "\u001b[36m[2023-09-14 12:03:16,428][97397] RunningMeanStd input shape: (23,)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,429][97397] RunningMeanStd input shape: (3, 72, 128)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,430][97397] RunningMeanStd input shape: (1,)\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,443][97397] ConvEncoder: input_channels=3\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,582][97397] Conv encoder output size: 512\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:16,585][97397] Policy head output size: 640\u001b[0m\n", + "\u001b[33m[2023-09-14 12:03:17,532][97397] Loading state from checkpoint /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000246_1007616.pth...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:17,565][97397] Port 40300 is available\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:17,567][97397] Using port 40300\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:03:17,568][97397] Initializing env for player 0, init_info: {'port': 40300}...\u001b[0m\n", "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", " logger.warn(\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,229][39733] Initializing env for player 1, init_info: {'port': 40900}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,229][39698] Using port 40600 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,238][39698] Initializing env for player 1, init_info: {'port': 40600}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,253][39685] Initializing env for player 2, init_info: {'port': 40300}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,263][39696] Initializing env for player 2, init_info: {'port': 40500}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,264][39734] Initializing env for player 2, init_info: {'port': 41000}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,267][39699] Initializing env for player 2, init_info: {'port': 40800}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,274][39697] Initializing env for player 2, init_info: {'port': 40400}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,279][39733] Initializing env for player 2, init_info: {'port': 40900}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,291][39698] Initializing env for player 2, init_info: {'port': 40600}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,303][39685] Initializing env for player 3, init_info: {'port': 40300}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,315][39734] Initializing env for player 3, init_info: {'port': 41000}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,321][39697] Initializing env for player 3, init_info: {'port': 40400}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,322][39696] Initializing env for player 3, init_info: {'port': 40500}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,324][39699] Initializing env for player 3, init_info: {'port': 40800}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,335][39733] Initializing env for player 3, init_info: {'port': 40900}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,341][39698] Initializing env for player 3, init_info: {'port': 40600}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,353][39685] Initializing env for player 4, init_info: {'port': 40300}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,370][39734] Initializing env for player 4, init_info: {'port': 41000}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,371][39696] Initializing env for player 4, init_info: {'port': 40500}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,371][39697] Initializing env for player 4, init_info: {'port': 40400}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,383][39733] Initializing env for player 4, init_info: {'port': 40900}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,385][39699] Initializing env for player 4, init_info: {'port': 40800}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,392][39698] Initializing env for player 4, init_info: {'port': 40600}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,404][39685] Initializing env for player 5, init_info: {'port': 40300}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,418][39696] Initializing env for player 5, init_info: {'port': 40500}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,426][39734] Initializing env for player 5, init_info: {'port': 41000}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,427][39697] Initializing env for player 5, init_info: {'port': 40400}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,431][39699] Initializing env for player 5, init_info: {'port': 40800}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,435][39733] Initializing env for player 5, init_info: {'port': 40900}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,443][39698] Initializing env for player 5, init_info: {'port': 40600}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,455][39685] Initializing env for player 6, init_info: {'port': 40300}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,475][39696] Initializing env for player 6, init_info: {'port': 40500}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,477][39699] Initializing env for player 6, init_info: {'port': 40800}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,479][39697] Initializing env for player 6, init_info: {'port': 40400}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,483][39734] Initializing env for player 6, init_info: {'port': 41000}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,485][39733] Initializing env for player 6, init_info: {'port': 40900}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,499][39698] Initializing env for player 6, init_info: {'port': 40600}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,515][39685] Initializing env for player 7, init_info: {'port': 40300}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,527][39696] Initializing env for player 7, init_info: {'port': 40500}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,535][39697] Initializing env for player 7, init_info: {'port': 40400}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,535][39734] Initializing env for player 7, init_info: {'port': 41000}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,539][39699] Initializing env for player 7, init_info: {'port': 40800}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,539][39733] Initializing env for player 7, init_info: {'port': 40900}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:52,551][39698] Initializing env for player 7, init_info: {'port': 40600}...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:03:17,618][97397] Initializing env for player 1, init_info: {'port': 40300}...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:17,668][97397] 2 agent workers initialized for env 0!\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:03:17,670][97397] Using port 40300 on host...\u001b[0m\n", "Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. ss 'Q' to abort network game synchronization.\n", - "Waiting for players: .. [ 2/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: \\Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", "Contacting host: /Press 'Q' to abort network game synchronization.\n", "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: .. [ 2/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 1. \n", - "Waiting for players: .. [ 2/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Waiting for other players: ..... [ 5/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 2. \n", - "Waiting for players: ... [ 3/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", + "Waiting for players: .. [ 2/ 2]\n", "Sending all here. \n", "\n", - "Waiting for other players: ........ [ 8/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", + "Total players: 2 \n", "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 2. 8]\n", - "Waiting for players: ... [ 3/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. \n", - "Waiting for other players: ... [ 3/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: \\Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ........ [ 8/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Got connect from node 3. \n", - "Waiting for players: .... [ 4/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 3 8]\n", - "Received All Here, sending ACK. \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Total players: 8 8]/ 8] 8]\n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Got connect from node 2. \n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 8]\n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Waiting for players: ....... [ 7/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "\n", - "Go \n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Contacting host: -\n", - "Got connect from node 6. \n", - "Waiting for players: ....... [ 7/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Got connect from node 4. 8]\n", - "Got connect from node 5. [ 5/ 8]\n", - "Got connect from node 6. 8]\n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Got connect from node 6. 8]... [ 6/ 8]\n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "\n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Got connect from node 7. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Found AI3 (node 2, player 3) 8]\n", - "Found AI2 (node 3, player 4) \n", - "Got connect from node 5. 8]\n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Got connect from node 7. 8]\n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI3 (node 3, player 3) \n", - "Console player number: 4 8]\n", - "Received All Here, sending ACK. \n", - "Found AI2 (node 4, player 4) \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) 8]\n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI3 (node 2, player 3) 8]\n", - "Found AI2 (node 3, player 4) \n", - "Console player number: 2 8]\n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Console player number: 3 8]\n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 8]\n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI3 (node 0, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 0, player 4) \n", - "Found AI5 (node 5, player 6) 8]\n", - "Found AI6 (node 6, player 7) \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Found AI4 (node 4, player 5) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI7 (node 7, player 8) \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "\n", - "Go \n", - "Total players: 8 \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "\n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Console player number: 7 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 5, player 5) \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI7 (node 7, player 8) \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "\n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 0, player 2) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI4 (node 4, player 5) \n", - "\n", - "Found AI5 (node 5, player 6) \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Found AI6 (node 6, player 7) \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Found AI7 (node 7, player 8) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 5, player 5) \n", - "\n", - "Go \n", - "Found AI5 (node 6, player 6) \n", - "\n", - "Go \n", - "Total players: 8 \n", - "Found AI6 (node 7, player 7) \n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Found AI7 (node 0, player 8) \n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "\n", - "Exchanging game information.\n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Go \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI4 (node 4, player 5) \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Received All Here, sending ACK. \n", - "Found AI7 (node 7, player 8) \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Go \n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "\n", - "Go \n", - "Total players: 8 \n", - "\u001b[36m[2023-09-12 21:01:53,664][28625] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 0. Throughput: 0: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI5 (node 2, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI7 (node 6, player 7) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 1, player 2) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,759][39685] Initialized w:0 v:0 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,761][39685] Initialized w:0 v:0 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,762][39685] Initialized w:0 v:0 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,762][39685] Initialized w:0 v:0 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,762][39685] Initialized w:0 v:0 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,762][39685] Initialized w:0 v:0 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,763][39685] Initialized w:0 v:0 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,763][39685] Initialized w:0 v:0 player:0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:53,765][39685] 8 agent workers initialized for env 0!\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI3 (node 0, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 0, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI2 (node 0, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI7 (node 4, player 5) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI2 (node 5, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI5 (node 2, player 3) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI7 (node 7, player 7) \n", - "Found AI6 (node 0, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI3 (node 6, player 6) \n", - "Found AI7 (node 0, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI7 (node 0, player 5) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI2 (node 5, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI3 (node 6, player 6) \n", - "Found AI7 (node 7, player 7) \n", - "Found AI6 (node 0, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,832][39685] Decorrelating experience for 0 frames...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:53,833][39685] Port 40301 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:53,833][39685] Using port 40301\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,834][39685] Initializing env for player 0, init_info: {'port': 40301}...\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI5 (node 2, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI7 (node 5, player 5) \n", - "Found AI2 (node 0, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI5 (node 2, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 0, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 4, player 5) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI2 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 5, player 5) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI2 (node 6, player 6) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI3 (node 7, player 7) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI6 (node 0, player 8) \n", - "Found AI5 (node 0, player 6) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,863][39685] Using port 40301 on host...\u001b[0m\n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "\n", - "Found AI1 (node 0, player 2) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI4 (node 0, player 4) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI1 (node 2, player 3) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 4, player 5) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI2 (node 1, player 2) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI7 (node 5, player 5) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI5 (node 0, player 3) \n", - "Found AI2 (node 0, player 5) \n", - "Found AI2 (node 6, player 6) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI3 (node 0, player 7) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,884][39685] Initializing env for player 1, init_info: {'port': 40301}...\u001b[0m\n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 4, player 5) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 5, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "\n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI4 (node 0, player 4) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI7 (node 4, player 5) \n", - "Found AI1 (node 0, player 3) \n", - "Found AI2 (node 5, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI5 (node 4, player 5) \n", - "Found AI2 (node 3, player 3) \n", - "\n", - "Found AI3 (node 5, player 6) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 0, player 4) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI7 (node 0, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Found AI3 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI7 (node 0, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "\n", - "Found AI4 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 0, player 7) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI4 (node 4, player 4) \n", - "\n", - "Found AI5 (node 5, player 5) \n", - "Found AI3 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI5 (node 5, player 5) \n", - "\n", - "Found AI3 (node 6, player 6) \n", - "\n", - "Found AI6 (node 7, player 7) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "\n", - "\n", - "Found AI4 (node 4, player 4) \n", - "Found AI1 (node 2, player 2) \n", - "\n", - "Found AI3 (node 0, player 3) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI5 (node 7, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI6 (node 0, player 8) \n", - "\n", - "Found AI2 (node 2, player 2) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,935][39685] Initializing env for player 2, init_info: {'port': 40301}...\u001b[0m\n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI5 (node 0, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI4 (node 0, player 4) \n", - "Found AI5 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "\n", - "Found AI2 (node 2, player 2) \n", - "\n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI5 (node 5, player 5) \n", - "Found AI3 (node 0, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "\n", - "Found AI7 (node 7, player 8) \n", - "\n", - "\n", - "\n", - "\n", - "\n", - "Found AI2 (node 0, player 2) \n", - "\n", - "Found AI1 (node 2, player 3) \n", - "\n", - "Found AI4 (node 3, player 4) \n", - "Found AI5 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,991][39697] Initialized w:1 v:0 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,992][39685] Initializing env for player 3, init_info: {'port': 40301}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,993][39697] Initialized w:1 v:0 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,994][39697] Initialized w:1 v:0 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,994][39697] Initialized w:1 v:0 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,995][39697] Initialized w:1 v:0 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,995][39697] Initialized w:1 v:0 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,995][39697] Initialized w:1 v:0 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:53,995][39697] Initialized w:1 v:0 player:4\u001b[0m\n", - "\n", - "\u001b[36m[2023-09-12 21:01:53,997][39697] 8 agent workers initialized for env 1!\u001b[0m\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,031][39699] Initialized w:5 v:0 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,034][39699] Initialized w:5 v:0 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,034][39699] Initialized w:5 v:0 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,034][39699] Initialized w:5 v:0 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,035][39699] Initialized w:5 v:0 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,035][39734] Initialized w:7 v:0 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,035][39699] Initialized w:5 v:0 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,036][39699] Initialized w:5 v:0 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,036][39699] Initialized w:5 v:0 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,038][39734] Initialized w:7 v:0 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,038][39734] Initialized w:7 v:0 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,038][39734] Initialized w:7 v:0 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,038][39734] Initialized w:7 v:0 player:6\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,038][39699] 8 agent workers initialized for env 5!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,039][39734] Initialized w:7 v:0 player:0\u001b[0m\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,039][39734] Initialized w:7 v:0 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,039][39734] Initialized w:7 v:0 player:1\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,042][39734] 8 agent workers initialized for env 7!\u001b[0m\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,055][39733] Initialized w:6 v:0 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,055][39685] Initializing env for player 4, init_info: {'port': 40301}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,056][39697] Decorrelating experience for 0 frames...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,057][39733] Initialized w:6 v:0 player:1\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,058][39697] Port 40401 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,058][39697] Using port 40401\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,058][39733] Initialized w:6 v:0 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,058][39733] Initialized w:6 v:0 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,058][39733] Initialized w:6 v:0 player:6\u001b[0m\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,058][39697] Initializing env for player 0, init_info: {'port': 40401}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,059][39733] Initialized w:6 v:0 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,059][39733] Initialized w:6 v:0 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,059][39733] Initialized w:6 v:0 player:0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,061][39733] 8 agent workers initialized for env 6!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,064][39731] Initializing env for player 0, init_info: {'port': 40700}...\u001b[0m\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,086][39699] Decorrelating experience for 0 frames...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,088][39699] Port 40801 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,089][39699] Using port 40801\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,089][39699] Initializing env for player 0, init_info: {'port': 40801}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,091][39734] Decorrelating experience for 0 frames...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,093][39734] Port 41001 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,094][39734] Using port 41001\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,094][39697] Using port 40401 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:5\u001b[0m\n", - "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.seed to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.seed` for environment variables or `env.get_wrapper_attr('seed')` that will search the reminding wrappers.\u001b[0m\n", - " logger.warn(\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,098][39731] Using port 40700 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:2\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,100][39698] 8 agent workers initialized for env 3!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,103][39685] Initializing env for player 5, init_info: {'port': 40301}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,112][39733] Decorrelating experience for 0 frames...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,114][39733] Port 40901 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,115][39733] Using port 40901\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,115][39731] Initializing env for player 1, init_info: {'port': 40700}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,115][39733] Initializing env for player 0, init_info: {'port': 40901}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,119][39696] Initialized w:2 v:0 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,120][39696] Initialized w:2 v:0 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,120][39696] Initialized w:2 v:0 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,120][39696] Initialized w:2 v:0 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,120][39696] Initialized w:2 v:0 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,120][39696] Initialized w:2 v:0 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,121][39696] Initialized w:2 v:0 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,121][39696] Initialized w:2 v:0 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,123][39697] Initializing env for player 1, init_info: {'port': 40401}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,124][39696] 8 agent workers initialized for env 2!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,132][39699] Using port 40801 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,141][39699] Initializing env for player 1, init_info: {'port': 40801}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,148][39698] Decorrelating experience for 0 frames...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,149][39698] Port 40601 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,150][39698] Using port 40601\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,150][39698] Initializing env for player 0, init_info: {'port': 40601}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,157][39733] Using port 40901 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,157][39696] Decorrelating experience for 0 frames...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,159][39696] Port 40501 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:54,159][39696] Using port 40501\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,166][39733] Initializing env for player 1, init_info: {'port': 40901}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,167][39685] Initializing env for player 6, init_info: {'port': 40301}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,165][39731] Initializing env for player 2, init_info: {'port': 40700}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,173][39697] Initializing env for player 2, init_info: {'port': 40401}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,179][39698] Using port 40601 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,192][39699] Initializing env for player 2, init_info: {'port': 40801}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,201][39698] Initializing env for player 1, init_info: {'port': 40601}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,213][39685] Initializing env for player 7, init_info: {'port': 40301}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,217][39731] Initializing env for player 3, init_info: {'port': 40700}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,219][39733] Initializing env for player 2, init_info: {'port': 40901}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,230][39697] Initializing env for player 3, init_info: {'port': 40401}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,242][39699] Initializing env for player 3, init_info: {'port': 40801}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,251][39698] Initializing env for player 2, init_info: {'port': 40601}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,269][39733] Initializing env for player 3, init_info: {'port': 40901}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,273][39731] Initializing env for player 4, init_info: {'port': 40700}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,283][39697] Initializing env for player 4, init_info: {'port': 40401}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,303][39698] Initializing env for player 3, init_info: {'port': 40601}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,318][39699] Initializing env for player 4, init_info: {'port': 40801}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,327][39731] Initializing env for player 5, init_info: {'port': 40700}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,339][39697] Initializing env for player 5, init_info: {'port': 40401}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,339][39733] Initializing env for player 4, init_info: {'port': 40901}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:54,355][39698] Initializing env for player 4, init_info: {'port': 40601}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:54,372][39699] Initializing env for player 5, init_info: {'port': 40801}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,387][39731] Initializing env for player 6, init_info: {'port': 40700}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,388][39733] Initializing env for player 5, init_info: {'port': 40901}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,395][39697] Initializing env for player 6, init_info: {'port': 40401}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,410][39698] Initializing env for player 5, init_info: {'port': 40601}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,427][39699] Initializing env for player 6, init_info: {'port': 40801}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,438][39733] Initializing env for player 6, init_info: {'port': 40901}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,443][39731] Initializing env for player 7, init_info: {'port': 40700}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,446][39697] Initializing env for player 7, init_info: {'port': 40401}...\u001b[0m\n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:54,463][39698] Initializing env for player 6, init_info: {'port': 40601}...\u001b[0m\n", - "Contacting host: -\u001b[37m\u001b[1m[2023-09-12 21:01:54,479][39699] Initializing env for player 7, init_info: {'port': 40801}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,499][39733] Initializing env for player 7, init_info: {'port': 40901}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:54,523][39698] Initializing env for player 7, init_info: {'port': 40601}...\u001b[0m\n", - "Got connect from node 1. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: .. [ 2/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 2. \n", - "Waiting for players: ... [ 3/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ... [ 3/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Waiting for players: ...... [ 6/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 1. \n", - "Waiting for players: .. [ 2/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Waiting for players: ... [ 3/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. \n", - "Waiting for players: .. [ 2/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. 8]\n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Waiting for players: .... [ 4/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 6. \n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 3. 8]\n", - "Got connect from node 4. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 2. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: .. [ 2/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Done waiting.Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ... [ 3/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 3. 8]\n", - "Got connect from node 4. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Waiting for players: ....... [ 7/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Got connect from node 2. 8]\n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Console player number: 7 8]\n", - "Received All Here, sending ACK. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 5. 8]\n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Console player number: 2 8]\n", - "Received All Here, sending ACK. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Total players: 8 8]\n", - "Waiting for other players: ....\n", - "Waiting for other players: . [ 5/ 8]....8]..\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "\n", - "Go \n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "\n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 ... 7/ 8]. [ 7/ 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "\n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "\n", - "Exchanging game information.\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Go \n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "\n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "\n", - "Go \n", - "\n", - "Go \n", - "Total players: 8 \n", - "Total players: 8 \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Go \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "Received \"Go.\" \n", - "\n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI1 (node 1, player 2) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI4 (node 6, player 7) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI2 (node 3, player 4) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Found AI1 (node 0, player 2) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI4 (node 6, player 7) \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI6 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "\n", - "Go \n", - "Found AI4 (node 0, player 7) \n", - "Total players: 8 \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "\n", - "Found AI2 (node 0, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI4 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI6 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI4 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Received All Here, sending ACK. \n", - "\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 0, player 3) \n", - "\n", - "Exchanging game information.\n", - "Found AI2 (node 3, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI4 (node 6, player 7) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI6 (node 0, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI4 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 5, player 5) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI4 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI1 (node 1, player 2) \n", - "\n", - "Found AI2 (node 2, player 3) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI4 (node 0, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI4 (node 2, player 3) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI7 (node 0, player 6) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 1, player 2) \n", - "Found AI1 (node 2, player 3) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI6 (node 5, player 5) \n", - "Found AI3 (node 4, player 4) \n", - "\n", - "Found AI3 (node 0, player 6) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI5 (node 0, player 7) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI6 (node 0, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 0, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "\n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI3 (node 0, player 4) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI4 (node 4, player 5) \n", - "\n", - "Found AI4 (node 3, player 4) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 7, player 7) \n", - "Found AI6 (node 0, player 8) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI3 (node 0, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI2 (node 0, player 2) \n", - "Found AI1 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,800][39685] Initialized w:0 v:1 player:4\u001b[0m\n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI3 (node 2, player 3) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,802][39685] Initialized w:0 v:1 player:1\u001b[0m\n", - "Found AI4 (node 3, player 4) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,802][39685] Initialized w:0 v:1 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,802][39685] Initialized w:0 v:1 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,802][39685] Initialized w:0 v:1 player:7\u001b[0m\n", - "Found AI7 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,803][39685] Initialized w:0 v:1 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,803][39685] Initialized w:0 v:1 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,803][39685] Initialized w:0 v:1 player:2\u001b[0m\n", - "Found AI2 (node 4, player 5) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "\u001b[36m[2023-09-12 21:01:55,805][39685] 8 agent workers initialized for env 0!\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 0, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI6 (node 5, player 5) \n", - "Found AI3 (node 6, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 0, player 7) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI6 (node 5, player 5) \n", - "Found AI3 (node 6, player 6) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI5 (node 7, player 7) \n", - "Found AI4 (node 2, player 3) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 0, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI2 (node 4, player 5) \n", - "\n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 0, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI4 (node 0, player 4) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI2 (node 0, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 0, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI1 (node 2, player 2) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,848][39734] Initializing env for player 0, init_info: {'port': 41001}...\u001b[0m\n", - "Found AI2 (node 5, player 5) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI2 (node 0, player 5) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI2 (node 4, player 5) \n", - "\n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "\n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,857][39685] Decorrelating experience for 32 frames...\u001b[0m\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "Found AI1 (node 2, player 2) \n", - "\n", - "Found AI3 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "\n", - "\n", - "\n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,898][39734] Using port 41001 on host...\u001b[0m\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,898][39734] Initializing env for player 1, init_info: {'port': 41001}...\u001b[0m\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,931][39698] Initialized w:3 v:1 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,933][39698] Initialized w:3 v:1 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,933][39698] Initialized w:3 v:1 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,934][39698] Initialized w:3 v:1 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,934][39698] Initialized w:3 v:1 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,934][39698] Initialized w:3 v:1 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,934][39698] Initialized w:3 v:1 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,934][39698] Initialized w:3 v:1 player:0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:55,937][39698] 8 agent workers initialized for env 3!\u001b[0m\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,950][39734] Initializing env for player 2, init_info: {'port': 41001}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,969][39733] Initialized w:6 v:1 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,971][39733] Initialized w:6 v:1 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,971][39733] Initialized w:6 v:1 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,972][39733] Initialized w:6 v:1 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,972][39733] Initialized w:6 v:1 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,972][39733] Initialized w:6 v:1 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,973][39733] Initialized w:6 v:1 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,973][39733] Initialized w:6 v:1 player:4\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:55,974][39733] 8 agent workers initialized for env 6!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,974][39698] Decorrelating experience for 32 frames...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,977][39731] Initialized w:4 v:0 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,977][39731] Initialized w:4 v:0 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,978][39731] Initialized w:4 v:0 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,978][39731] Initialized w:4 v:0 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,978][39731] Initialized w:4 v:0 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,978][39696] Initializing env for player 0, init_info: {'port': 40501}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,978][39731] Initialized w:4 v:0 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,979][39731] Initialized w:4 v:0 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:55,979][39731] Initialized w:4 v:0 player:0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:55,982][39731] 8 agent workers initialized for env 4!\u001b[0m\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,004][39697] Initialized w:1 v:1 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,007][39697] Initialized w:1 v:1 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,007][39697] Initialized w:1 v:1 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,008][39697] Initialized w:1 v:1 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,008][39697] Initialized w:1 v:1 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,008][39697] Initialized w:1 v:1 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,008][39697] Initialized w:1 v:1 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,009][39697] Initialized w:1 v:1 player:7\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,011][39697] 8 agent workers initialized for env 1!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,015][39734] Initializing env for player 3, init_info: {'port': 41001}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,024][39731] Decorrelating experience for 0 frames...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,024][39696] Using port 40501 on host...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,029][39731] Port 40701 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,029][39731] Using port 40701\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,030][39731] Initializing env for player 0, init_info: {'port': 40701}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,030][39733] Decorrelating experience for 32 frames...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,035][39696] Initializing env for player 1, init_info: {'port': 40501}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,042][39697] Decorrelating experience for 32 frames...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,055][39699] Initialized w:5 v:1 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,056][39699] Initialized w:5 v:1 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,057][39699] Initialized w:5 v:1 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,057][39699] Initialized w:5 v:1 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,057][39699] Initialized w:5 v:1 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,058][39699] Initialized w:5 v:1 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,058][39699] Initialized w:5 v:1 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,059][39699] Initialized w:5 v:1 player:5\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,061][39699] 8 agent workers initialized for env 5!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,067][39734] Initializing env for player 4, init_info: {'port': 41001}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,070][39731] Using port 40701 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,080][39731] Initializing env for player 1, init_info: {'port': 40701}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,088][39696] Initializing env for player 2, init_info: {'port': 40501}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,096][39699] Decorrelating experience for 32 frames...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,131][39731] Initializing env for player 2, init_info: {'port': 40701}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,126][39734] Initializing env for player 5, init_info: {'port': 41001}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,139][39696] Initializing env for player 3, init_info: {'port': 40501}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,179][39734] Initializing env for player 6, init_info: {'port': 41001}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,183][39731] Initializing env for player 3, init_info: {'port': 40701}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,195][39696] Initializing env for player 4, init_info: {'port': 40501}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,231][39734] Initializing env for player 7, init_info: {'port': 41001}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,235][39731] Initializing env for player 4, init_info: {'port': 40701}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,241][39696] Initializing env for player 5, init_info: {'port': 40501}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,259][39685] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,284][39731] Initializing env for player 5, init_info: {'port': 40701}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,299][39696] Initializing env for player 6, init_info: {'port': 40501}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,306][39685] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,338][39731] Initializing env for player 6, init_info: {'port': 40701}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,340][39685] Port 40302 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,340][39685] Using port 40302\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,341][39685] Initializing env for player 0, init_info: {'port': 40302}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,360][39696] Initializing env for player 7, init_info: {'port': 40501}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,367][39698] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,387][39685] Using port 40302 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,391][39731] Initializing env for player 7, init_info: {'port': 40701}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,398][39685] Initializing env for player 1, init_info: {'port': 40302}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,413][39698] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,437][39733] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,455][39685] Initializing env for player 2, init_info: {'port': 40302}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,459][39698] Port 40602 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,459][39698] Using port 40602\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,460][39698] Initializing env for player 0, init_info: {'port': 40602}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,482][39733] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,505][39698] Using port 40602 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,505][39685] Initializing env for player 3, init_info: {'port': 40302}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,509][39697] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,516][39698] Initializing env for player 1, init_info: {'port': 40602}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,528][39733] Port 40902 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,528][39733] Using port 40902\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,529][39733] Initializing env for player 0, init_info: {'port': 40902}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,553][39697] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,555][39699] Multi agent env, num agents: 8\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:56,557][39685] Initializing env for player 4, init_info: {'port': 40302}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:56,566][39698] Initializing env for player 2, init_info: {'port': 40602}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:56,573][39733] Using port 40902 on host...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:56,584][39733] Initializing env for player 1, init_info: {'port': 40902}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,605][39699] Multi agent env, num agents: 8\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,611][39685] Initializing env for player 5, init_info: {'port': 40302}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,617][39698] Initializing env for player 3, init_info: {'port': 40602}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,621][39697] Port 40402 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:56,621][39697] Using port 40402\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,622][39697] Initializing env for player 0, init_info: {'port': 40402}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]\u001b[36m[2023-09-12 21:01:56,637][39699] Port 40802 is available\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[36m[2023-09-12 21:01:56,637][39699] Using port 40802\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,637][39699] Initializing env for player 0, init_info: {'port': 40802}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,644][39733] Initializing env for player 2, init_info: {'port': 40902}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,658][39697] Using port 40402 on host...\u001b[0m\n", - "Contacting host: -\u001b[37m\u001b[1m[2023-09-12 21:01:56,659][39685] Initializing env for player 6, init_info: {'port': 40302}...\u001b[0m\n", - "Contacting host: -\u001b[37m\u001b[1m[2023-09-12 21:01:56,673][39697] Initializing env for player 1, init_info: {'port': 40402}...\u001b[0m\n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:56,676][39698] Initializing env for player 4, init_info: {'port': 40602}...\u001b[0m\n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Waiting for players: ... [ 3/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:56,681][39699] Using port 40802 on host...\u001b[0m\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:56,688][39699] Initializing env for player 1, init_info: {'port': 40802}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,707][39733] Initializing env for player 3, init_info: {'port': 40902}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,713][39685] Initializing env for player 7, init_info: {'port': 40302}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:56,726][39697] Initializing env for player 2, init_info: {'port': 40402}...\u001b[0m\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:56,739][39699] Initializing env for player 2, init_info: {'port': 40802}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:56,747][39698] Initializing env for player 5, init_info: {'port': 40602}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,755][39733] Initializing env for player 4, init_info: {'port': 40902}...\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 3. \n", - "Contacting host: -\u001b[37m\u001b[1m[2023-09-12 21:01:56,787][39697] Initializing env for player 3, init_info: {'port': 40402}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,790][39699] Initializing env for player 3, init_info: {'port': 40802}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,801][39698] Initializing env for player 6, init_info: {'port': 40602}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:56,821][39733] Initializing env for player 5, init_info: {'port': 40902}...\u001b[0m\n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -\u001b[37m\u001b[1m[2023-09-12 21:01:56,851][39698] Initializing env for player 7, init_info: {'port': 40602}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,851][39697] Initializing env for player 4, init_info: {'port': 40402}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,856][39699] Initializing env for player 4, init_info: {'port': 40802}...\u001b[0m\n", - "Waiting for other players: ...Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: .... [ 4/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. 8]\n", - "Got connect from node 2. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,883][39733] Initializing env for player 6, init_info: {'port': 40902}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,903][39697] Initializing env for player 5, init_info: {'port': 40402}...\u001b[0m\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:56,927][39699] Initializing env for player 5, init_info: {'port': 40802}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,935][39733] Initializing env for player 7, init_info: {'port': 40902}...\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Got connect from node 3. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,973][39699] Initializing env for player 6, init_info: {'port': 40802}...\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 3. \n", - "Got connect from node 7. 8]\n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Contacting host: -\u001b[37m\u001b[1m[2023-09-12 21:01:57,024][39699] Initializing env for player 7, init_info: {'port': 40802}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:56,971][39697] Initializing env for player 6, init_info: {'port': 40402}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,035][39697] Initializing env for player 7, init_info: {'port': 40402}...\u001b[0m\n", - "Got connect from node 4. 8]\n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Got connect from node 4. 8]\n", - "Waiting for players: ..... [ 5/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ........ [ 8/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 7 8]\n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Waiting for other players: ..... [ 5/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 4 8]\n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Waiting for players: ..... [ 5/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "\n", - "Go \n", - "Total players: 8 \n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Go \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "Waiting for other players: ..... [ 5/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Exchanging game information.\n", - "Exchanging game information.Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Contacting host: -\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Got connect from node 1. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Waiting for players: . [ 1/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI0_host (node 1, player 1) \n", - "Got connect from node 1. \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Got connect from node 1. \n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Got connect from node 2. 8]\n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Found AI7 (node 7, player 8) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI5 (node 2, player 3) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI2 (node 3, player 4) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 6, player 6) \n", - "Found AI3 (node 7, player 7) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Found AI7 (node 0, player 8) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI0_host (node 1, player 1) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 1, player 2) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 3, player 3) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI6 (node 0, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Got connect from node 2. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI5 (node 2, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI6 (node 0, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI7 (node 7, player 8) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 0, player 3) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Found AI2 (node 3, player 4) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI2 (node 4, player 4) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI3 (node 6, player 7) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI6 (node 6, player 6) \n", - "Found AI3 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Go \n", - "Total players: 8 \n", - "Found AI1 (node 2, player 2) 8]\n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 0, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Waiting for players: ....... [ 7/ 8] 7/ 8]\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "\n", - "Found AI6 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 3, player 3) \n", - "Found AI2 (node 0, player 4) 8]8] [ 2/ 8]\n", - "Found AI4 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI1 (node 2, player 2) 8]\n", - "\n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Contacting host: -\n", - "Found AI6 (node 6, player 6) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Found AI5 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI6 (node 6, player 6) \n", - "Found AI5 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI1 (node 0, player 2) \n", - "\n", - "Exchanging game information.Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "\n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for players: ... [ 3/ 8] 7/ 8]\n", - "Exchanging game information.\n", - "\n", - "Contacting host: -players: ....... [ 7/ 8]\n", - "\n", - "Contacting host: -\n", - "Got connect from node 4. 8]\n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Waiting for players: ....... [ 7/ 8]\n", - "Got connect from node 7. 8]\n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Got connect from node 3. \n", - "Got connect from node 4. 4/ 8].. [ 5/ 8]\n", - "Got connect from node 5. [ 5/ 8]\n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - ".. [ 8/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 \n", - "\n", - "Found AI0_host (node 1, player 1) 8]\n", - "....... [ 7/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:57,632][39734] Initialized w:7 v:1 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,633][39734] Initialized w:7 v:1 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,633][39734] Initialized w:7 v:1 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,634][39734] Initialized w:7 v:1 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,634][39734] Initialized w:7 v:1 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,634][39734] Initialized w:7 v:1 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,634][39734] Initialized w:7 v:1 player:6\u001b[0m\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,635][39734] Initialized w:7 v:1 player:5\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:57,636][39734] 8 agent workers initialized for env 7!\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Waiting for other players: ....... [ 7/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI0_host (node 1, player 1) 8]\n", - "Got connect from node 3. 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,687][39696] Initialized w:2 v:1 player:5\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:57,688][39696] Initialized w:2 v:1 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,688][39696] Initialized w:2 v:1 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,689][39696] Initialized w:2 v:1 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,690][39696] Initialized w:2 v:1 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,690][39696] Initialized w:2 v:1 player:2\u001b[0m\n", - "Waiting for other players: .... [ 4/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:57,691][39696] Initialized w:2 v:1 player:3\u001b[0m\n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Done waiting.\u001b[37m\u001b[1m[2023-09-12 21:01:57,692][39696] Initialized w:2 v:1 player:7\u001b[0m\n", - "Found AI6 (node 6, player 7) \n", - "Found AI5 (node 5, player 6) \n", - "\u001b[36m[2023-09-12 21:01:57,692][39696] 8 agent workers initialized for env 2!\u001b[0m\n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI4 (node 2, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI1 (node 2, player 2) 8]\n", - "Found AI4 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ........ [ 8/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:57,710][39734] Decorrelating experience for 32 frames...\u001b[0m\n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Console player number: 2 8]\n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 2, player 2) 8]\n", - "Found AI4 (node 3, player 3) 8]\n", - "Found AI2 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Console player number: 3 8]\n", - "Received All Here, sending ACK. \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Console player number: 4 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Waiting for other players: ........ [ 8/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:57,747][39696] Decorrelating experience for 32 frames...\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Found AI1 (node 0, player 2) \n", - "Found AI4 (node 2, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI4 (node 0, player 3) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) 8]\n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI2 (node 0, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI3 (node 0, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 8]\n", - "Received All Here, sending ACK. \n", - "\n", - "Go \n", - "Total players: 8 \n", - "\n", - "\n", - "\n", - "\n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "\n", - "Go \n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Contacting host: -\n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Done waiting.\n", - "Exchanging game information.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Go \n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:57,901][39731] Initialized w:4 v:1 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,902][39731] Initialized w:4 v:1 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,902][39731] Initialized w:4 v:1 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,902][39731] Initialized w:4 v:1 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,903][39731] Initialized w:4 v:1 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,903][39731] Initialized w:4 v:1 player:0\u001b[0m\n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:57,904][39731] Initialized w:4 v:1 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,904][39731] Initialized w:4 v:1 player:2\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:57,906][39731] 8 agent workers initialized for env 4!\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "\n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Found AI0_host (node 1, player 1) 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:57,948][39731] Decorrelating experience for 32 frames...\u001b[0m\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI0_host (node 1, player 1) 8]\n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[36m[2023-09-12 21:01:58,004][39734] Multi agent env, num agents: 8\u001b[0m\n", - "Found AI2 (node 2, player 3) 8]\n", - "Found AI3 (node 3, player 4) \n", - "Found AI5 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI1 (node 1, player 2) \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 1, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Found AI3 (node 3, player 4) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 0, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[36m[2023-09-12 21:01:58,038][39734] Multi agent env, num agents: 8\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 0, player 6) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI5 (node 4, player 5) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 0, player 4) \n", - "Found AI5 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI5 (node 0, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Go \n", - "Total players: 8 \n", - "\u001b[36m[2023-09-12 21:01:58,069][39734] Port 41002 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:58,069][39734] Using port 41002\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,069][39734] Initializing env for player 0, init_info: {'port': 41002}...\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI5 (node 5, player 5) \n", - "Found AI4 (node 0, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI5 (node 5, player 5) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 6, player 6) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI2 (node 3, player 3) \n", - "\n", - "Found AI6 (node 7, player 7) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI3 (node 4, player 4) \n", - "Found AI5 (node 0, player 8) \n", - "Found AI5 (node 5, player 5) \n", - "Found AI4 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:58,100][39734] Using port 41002 on host...\u001b[0m\n", - "Found AI2 (node 1, player 2) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI1 (node 2, player 3) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI5 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI2 (node 0, player 2) \n", - "\n", - "Go \n", - "Found AI1 (node 2, player 3) \n", - "Total players: 8 \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI5 (node 7, player 8) \n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:58,120][39734] Initializing env for player 1, init_info: {'port': 41002}...\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI2 (node 2, player 2) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI2 (node 2, player 2) \n", - "\n", - "Found AI1 (node 0, player 3) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI3 (node 0, player 5) \n", - "\n", - "Found AI5 (node 5, player 6) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 0, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,171][39734] Initializing env for player 2, init_info: {'port': 41002}...\u001b[0m\n", - "\n", - "Exchanging game information.\n", - "\u001b[36m[2023-09-12 21:01:58,185][39696] Multi agent env, num agents: 8\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "\n", - "\n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,227][39734] Initializing env for player 3, init_info: {'port': 41002}...\u001b[0m\n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[36m[2023-09-12 21:01:58,232][39696] Multi agent env, num agents: 8\u001b[0m\n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,239][39685] Initialized w:0 v:2 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,241][39685] Initialized w:0 v:2 player:6\u001b[0m\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,242][39685] Initialized w:0 v:2 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,243][39685] Initialized w:0 v:2 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,244][39685] Initialized w:0 v:2 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,245][39685] Initialized w:0 v:2 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,246][39685] Initialized w:0 v:2 player:4\u001b[0m\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,249][39685] Initialized w:0 v:2 player:7\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[36m[2023-09-12 21:01:58,250][39685] 8 agent workers initialized for env 0!\u001b[0m\n", - "\n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,275][39734] Initializing env for player 4, init_info: {'port': 41002}...\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI3 (node 3, player 4) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,279][39733] Initialized w:6 v:2 player:3\u001b[0m\n", - "Found AI1 (node 1, player 2) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI7 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI2 (node 2, player 3) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,281][39733] Initialized w:6 v:2 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,281][39733] Initialized w:6 v:2 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,284][39733] Initialized w:6 v:2 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,284][39733] Initialized w:6 v:2 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,287][39733] Initialized w:6 v:2 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,287][39733] Initialized w:6 v:2 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,288][39733] Initialized w:6 v:2 player:4\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:58,289][39733] 8 agent workers initialized for env 6!\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI7 (node 5, player 5) \n", - "Found AI4 (node 6, player 6) \n", - "Found AI5 (node 0, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 0, player 4) \n", - "Found AI7 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI7 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,310][39698] Initialized w:3 v:2 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,312][39698] Initialized w:3 v:2 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,312][39698] Initialized w:3 v:2 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,312][39698] Initialized w:3 v:2 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,312][39698] Initialized w:3 v:2 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,312][39698] Initialized w:3 v:2 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,313][39698] Initialized w:3 v:2 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,313][39698] Initialized w:3 v:2 player:2\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[36m[2023-09-12 21:01:58,318][39698] 8 agent workers initialized for env 3!\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI7 (node 5, player 5) \n", - "Found AI4 (node 6, player 6) \n", - "Found AI5 (node 7, player 7) \n", - "Found AI6 (node 0, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,327][39734] Initializing env for player 5, init_info: {'port': 41002}...\u001b[0m\n", - "Found AI4 (node 4, player 5) \n", - "\u001b[36m[2023-09-12 21:01:58,328][39696] Port 40502 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:58,328][39696] Using port 40502\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,329][39696] Initializing env for player 0, init_info: {'port': 40502}...\u001b[0m\n", - "Found AI7 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,329][39685] Decorrelating experience for 64 frames...\u001b[0m\n", - "Found AI1 (node 1, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,343][39733] Decorrelating experience for 64 frames...\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI7 (node 0, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI7 (node 5, player 5) \n", - "Found AI4 (node 0, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,362][39696] Using port 40502 on host...\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI7 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 0, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,379][39696] Initializing env for player 1, init_info: {'port': 40502}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,379][39734] Initializing env for player 6, init_info: {'port': 41002}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,384][39698] Decorrelating experience for 64 frames...\u001b[0m\n", - "\n", - "\u001b[36m[2023-09-12 21:01:58,395][39731] Multi agent env, num agents: 8\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "\n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,431][39696] Initializing env for player 2, init_info: {'port': 40502}...\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "\u001b[36m[2023-09-12 21:01:58,434][39731] Multi agent env, num agents: 8\u001b[0m\n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,442][39734] Initializing env for player 7, init_info: {'port': 41002}...\u001b[0m\n", - "\n", - "\n", - "\n", - "\n", - "\u001b[36m[2023-09-12 21:01:58,471][39731] Port 40702 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:58,471][39731] Using port 40702\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,472][39731] Initializing env for player 0, init_info: {'port': 40702}...\u001b[0m\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,487][39696] Initializing env for player 3, init_info: {'port': 40502}...\u001b[0m\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,509][39731] Using port 40702 on host...\u001b[0m\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,522][39731] Initializing env for player 1, init_info: {'port': 40702}...\u001b[0m\n", - "\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,547][39696] Initializing env for player 4, init_info: {'port': 40502}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,571][39697] Initialized w:1 v:2 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,575][39731] Initializing env for player 2, init_info: {'port': 40702}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,577][39697] Initialized w:1 v:2 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,577][39697] Initialized w:1 v:2 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,578][39697] Initialized w:1 v:2 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,578][39697] Initialized w:1 v:2 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,578][39697] Initialized w:1 v:2 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,578][39697] Initialized w:1 v:2 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,579][39697] Initialized w:1 v:2 player:5\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:58,583][39697] 8 agent workers initialized for env 1!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,594][39696] Initializing env for player 5, init_info: {'port': 40502}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,615][39699] Initialized w:5 v:2 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,619][39699] Initialized w:5 v:2 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,620][39699] Initialized w:5 v:2 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,623][39699] Initialized w:5 v:2 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,625][39699] Initialized w:5 v:2 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,626][39699] Initialized w:5 v:2 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,626][39699] Initialized w:5 v:2 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,627][39699] Initialized w:5 v:2 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,627][39731] Initializing env for player 3, init_info: {'port': 40702}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:58,628][39699] 8 agent workers initialized for env 5!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,641][39697] Decorrelating experience for 64 frames...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,655][39696] Initializing env for player 6, init_info: {'port': 40502}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:58,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,678][39731] Initializing env for player 4, init_info: {'port': 40702}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,707][39696] Initializing env for player 7, init_info: {'port': 40502}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:58,717][39699] Decorrelating experience for 64 frames...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:58,731][39731] Initializing env for player 5, init_info: {'port': 40702}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:58,795][39731] Initializing env for player 6, init_info: {'port': 40702}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -\u001b[37m\u001b[1m[2023-09-12 21:01:58,871][39731] Initializing env for player 7, init_info: {'port': 40702}...\u001b[0m\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 3. \n", - "Waiting for players: .... [ 4/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: .... [ 4/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ...... [ 6/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[36m[2023-09-12 21:01:59,191][39733] Port 40903 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:59,191][39733] Using port 40903\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,192][39733] Initializing env for player 0, init_info: {'port': 40903}...\u001b[0m\n", - "Contacting host: -\u001b[37m\u001b[1m[2023-09-12 21:01:59,221][39733] Using port 40903 on host...\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Got connect from node 6. 8]\n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,243][39733] Initializing env for player 1, init_info: {'port': 40903}...\u001b[0m\n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Total players: 8 8]\n", - "Waiting for other players: \n", - "Waiting for other players: .. [ 8/ 8]. [ 1/ 8] [ 6/ 8]\n", - "Waiting for other players: ........ [ 8/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -\u001b[37m\u001b[1m[2023-09-12 21:01:59,293][39733] Initializing env for player 2, init_info: {'port': 40903}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:59,302][39685] Port 40303 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:59,302][39685] Using port 40303\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,302][39685] Initializing env for player 0, init_info: {'port': 40303}...\u001b[0m\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ........ [ 8/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Waiting for players: ...... [ 6/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:59,347][39685] Using port 40303 on host...\u001b[0m\n", - "Waiting for players: ...... [ 6/ 8]\u001b[36m[2023-09-12 21:01:59,347][39698] Port 40603 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:59,348][39698] Using port 40603\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,347][39733] Initializing env for player 3, init_info: {'port': 40903}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,348][39698] Initializing env for player 0, init_info: {'port': 40603}...\u001b[0m\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,360][39685] Initializing env for player 1, init_info: {'port': 40303}...\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:59,392][39698] Using port 40603 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,402][39698] Initializing env for player 1, init_info: {'port': 40603}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,409][39733] Initializing env for player 4, init_info: {'port': 40903}...\u001b[0m\n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,419][39685] Initializing env for player 2, init_info: {'port': 40303}...\u001b[0m\n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 3 8]\n", - "Received All Here, sending ACK. \n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Contacting host: -s: ... [ 3/ 8]\n", - "Go \n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:59,459][39698] Initializing env for player 2, init_info: {'port': 40603}...\u001b[0m\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:59,467][39733] Initializing env for player 5, init_info: {'port': 40903}...\u001b[0m\n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:59,470][39685] Initializing env for player 3, init_info: {'port': 40303}...\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,517][39698] Initializing env for player 3, init_info: {'port': 40603}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,519][39733] Initializing env for player 6, init_info: {'port': 40903}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "Waiting for other players: ........ [ 8/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:59,523][39685] Initializing env for player 4, init_info: {'port': 40303}...\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "\n", - "Found AI6 (node 6, player 7) \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI6 (node 7, player 7) \n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Found AI6 (node 6, player 7) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,575][39685] Initializing env for player 5, init_info: {'port': 40303}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,575][39698] Initializing env for player 4, init_info: {'port': 40603}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,578][39733] Initializing env for player 7, init_info: {'port': 40903}...\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 6, player 7) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "\u001b[36m[2023-09-12 21:01:59,592][39697] Port 40403 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:59,592][39697] Using port 40403\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,592][39697] Initializing env for player 0, init_info: {'port': 40403}...\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 6, player 7) \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,623][39698] Initializing env for player 5, init_info: {'port': 40603}...\u001b[0m\n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Waiting for other players: ...... [ 6/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:59,629][39697] Using port 40403 on host...\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 6, player 7) \n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 6, player 7) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,643][39697] Initializing env for player 1, init_info: {'port': 40403}...\u001b[0m\n", - "\n", - "Go \n", - "Total players: 8 \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI2 (node 1, player 2) \n", - "Found AI1 (node 2, player 3) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI4 (node 3, player 4) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,664][39685] Initializing env for player 6, init_info: {'port': 40303}...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:59,664][39699] Port 40803 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:59,665][39699] Using port 40803\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,665][39699] Initializing env for player 0, init_info: {'port': 40803}...\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 0, player 8) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 0, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 7, player 8) \n", - "\n", - "Exchanging game information.\n", - "Found AI2 (node 0, player 2) \n", - "Found AI1 (node 2, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 7, player 8) \n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Waiting for other players: ........ [ 8/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:59,694][39697] Initializing env for player 2, init_info: {'port': 40403}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,695][39698] Initializing env for player 6, init_info: {'port': 40603}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:59,707][39699] Using port 40803 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,718][39699] Initializing env for player 1, init_info: {'port': 40803}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,719][39685] Initializing env for player 7, init_info: {'port': 40303}...\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 0, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 7, player 8) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Exchanging game information.\n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI7 (node 0, player 6) \n", - "Found AI5 (node 7, player 8) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 0, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 7, player 8) \n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:59,744][39697] Initializing env for player 3, init_info: {'port': 40403}...\u001b[0m\n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:59,751][39698] Initializing env for player 7, init_info: {'port': 40603}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 7, player 8) \n", - "\n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,768][39699] Initializing env for player 2, init_info: {'port': 40803}...\u001b[0m\n", - "\n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI0_host (node 1, player 1) \n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:01:59,795][39697] Initializing env for player 4, init_info: {'port': 40403}...\u001b[0m\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:59,819][39699] Initializing env for player 3, init_info: {'port': 40803}...\u001b[0m\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "\n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Go \n", - "Total players: 8 \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Exchanging game information.\n", - "Found AI0_host (node 1, player 1) \n", - "Got connect from node 1. \n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI5 (node 1, player 2) \n", - "Found AI1 (node 2, player 3) \n", - "Found AI6 (node 6, player 7) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,857][39697] Initializing env for player 5, init_info: {'port': 40403}...\u001b[0m\n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,871][39699] Initializing env for player 4, init_info: {'port': 40803}...\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI5 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI2 (node 0, player 4) \n", - "\n", - "Found AI4 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:59,887][39734] Initialized w:7 v:2 player:3\u001b[0m\n", - "Received All Here, sending ACK. \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,888][39734] Initialized w:7 v:2 player:6\u001b[0m\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,889][39734] Initialized w:7 v:2 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,890][39734] Initialized w:7 v:2 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,890][39734] Initialized w:7 v:2 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,891][39734] Initialized w:7 v:2 player:5\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,891][39734] Initialized w:7 v:2 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,892][39734] Initialized w:7 v:2 player:4\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[36m[2023-09-12 21:01:59,893][39734] 8 agent workers initialized for env 7!\u001b[0m\n", - "Found AI5 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI3 (node 0, player 6) \n", - "\n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Exchanging game information.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:01:59,911][39697] Initializing env for player 6, init_info: {'port': 40403}...\u001b[0m\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI5 (node 0, player 2) \n", - "Found AI1 (node 2, player 3) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,931][39699] Initializing env for player 5, init_info: {'port': 40803}...\u001b[0m\n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 2, player 2) \n", - "Found AI1 (node 0, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI3 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:01:59,942][39734] Decorrelating experience for 64 frames...\u001b[0m\n", - "Found AI5 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI3 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI5 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI3 (node 6, player 6) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Got connect from node 2. \n", - "Waiting for players: ... [ 3/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,967][39697] Initializing env for player 7, init_info: {'port': 40403}...\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:01:59,979][39699] Initializing env for player 6, init_info: {'port': 40803}...\u001b[0m\n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Waiting for players: . [ 1/ 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ... [ 3/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,039][39699] Initializing env for player 7, init_info: {'port': 40803}...\u001b[0m\n", - "Found AI1 (node 1, player 2) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI4 (node 4, player 5) \n", - "\n", - "Found AI5 (node 5, player 6) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI3 (node 2, player 3) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Waiting for players: ..... [ 5/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:02:00,070][39696] Initialized w:2 v:2 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,072][39696] Initialized w:2 v:2 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,072][39696] Initialized w:2 v:2 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,073][39696] Initialized w:2 v:2 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,073][39696] Initialized w:2 v:2 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,074][39696] Initialized w:2 v:2 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,074][39696] Initialized w:2 v:2 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,074][39696] Initialized w:2 v:2 player:4\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:00,076][39696] 8 agent workers initialized for env 2!\u001b[0m\n", - "Found AI1 (node 0, player 2) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Got connect from node 1. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 0, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Found AI1 (node 2, player 2) 8]\n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,122][39696] Decorrelating experience for 64 frames...\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI6 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 0, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Contacting host: -\n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Contacting host: -s: ....... [ 7/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "\n", - "Got connect from node 3. 8]\n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -\n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,279][39731] Initialized w:4 v:2 player:5\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:02:00,280][39731] Initialized w:4 v:2 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,280][39731] Initialized w:4 v:2 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,280][39731] Initialized w:4 v:2 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,280][39731] Initialized w:4 v:2 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,280][39731] Initialized w:4 v:2 player:1\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:02:00,282][39731] Initialized w:4 v:2 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,282][39731] Initialized w:4 v:2 player:6\u001b[0m\n", - "Waiting for other players: ........ [ 8/ 8]\u001b[36m[2023-09-12 21:02:00,283][39731] 8 agent workers initialized for env 4!\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Got connect from node 4. 8]\n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Waiting for other players: ........ [ 8/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,332][39731] Decorrelating experience for 64 frames...\u001b[0m\n", - "Console player number: 7 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Got connect from node 7. 8]\n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Waiting for players: ....... [ 7/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: \n", - "Console player number: 3 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 8]\n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Got connect from node 1. 8]\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Go \n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Got connect from node 7. 8]\n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Got connect from node 1. \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "\n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Got connect from node 2. \n", - "Waiting for players: ... [ 3/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ........ [ 8/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[36m[2023-09-12 21:02:00,573][39734] Port 41003 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:00,573][39734] Using port 41003\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,573][39734] Initializing env for player 0, init_info: {'port': 41003}...\u001b[0m\n", - "Found AI0_host (node 1, player 1) 8]\n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "\n", - "Go \n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,605][39734] Using port 41003 on host...\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "Exchanging game information.\n", - "Exchanging game information.Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,624][39734] Initializing env for player 1, init_info: {'port': 41003}...\u001b[0m\n", - "\n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: ... [ 3/ 8]\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI2 (node 1, player 2) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI1 (node 2, player 3) \n", - "Found AI3 (node 4, player 5) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,674][39734] Initializing env for player 2, init_info: {'port': 41003}...\u001b[0m\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 8]\n", - "Received All Here, sending ACK. \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Go \n", - "Total players: 8 \n", - "Waiting for other players: .. [ 2/ 8]\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI2 (node 0, player 2) \n", - "Found AI1 (node 2, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Received All Here, sending ACK. \n", - "Found AI7 (node 6, player 7) \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI7 (node 0, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 0, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 0, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:02:00,727][39734] Initializing env for player 3, init_info: {'port': 41003}...\u001b[0m\n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 0, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "\n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "\n", - "Found AI2 (node 2, player 2) \n", - "Found AI1 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI7 (node 7, player 7) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,775][39734] Initializing env for player 4, init_info: {'port': 41003}...\u001b[0m\n", - "Found AI6 (node 0, player 8) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI2 (node 2, player 3) \n", - "Got connect from node 2. \n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 0, player 4) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI7 (node 0, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI6 (node 7, player 8) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Found AI3 (node 4, player 4) \n", - "\u001b[36m[2023-09-12 21:02:00,838][39696] Port 40503 is available\u001b[0m\n", - "Found AI4 (node 5, player 5) \n", - "\u001b[36m[2023-09-12 21:02:00,838][39696] Using port 40503\u001b[0m\n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 7, player 7) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,838][39696] Initializing env for player 0, init_info: {'port': 40503}...\u001b[0m\n", - "Found AI6 (node 0, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 0, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Console player number: 3 8]\n", - "Received All Here, sending ACK. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,847][39734] Initializing env for player 5, init_info: {'port': 41003}...\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Console player number: 4 8]\n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,867][39696] Using port 40503 on host...\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "\n", - "\n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,889][39696] Initializing env for player 1, init_info: {'port': 40503}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,891][39734] Initializing env for player 6, init_info: {'port': 41003}...\u001b[0m\n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Console player number: 2 8]\n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI4 (node 4, player 5) \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "\n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\u001b[36m[2023-09-12 21:02:00,925][39731] Port 40703 is available\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:00,925][39731] Using port 40703\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,926][39731] Initializing env for player 0, init_info: {'port': 40703}...\u001b[0m\n", - "\n", - "\n", - "Found AI1 (node 0, player 2) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Found AI3 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "\n", - "\n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI7 (node 7, player 7) \n", - "Found AI6 (node 0, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) 8]\n", - "Console player number: 2 8]\n", - "Received All Here, sending ACK. \n", - "\n", - "Go \n", - "Total players: 8 \n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,943][39734] Initializing env for player 7, init_info: {'port': 41003}...\u001b[0m\n", - "Console player number: 3 8]\n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 4 8]\n", - "Received All Here, sending ACK. \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,949][39696] Initializing env for player 2, init_info: {'port': 40503}...\u001b[0m\n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "\n", - "Exchanging game information.\n", - "Console player number: 6 8]\n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI3 (node 0, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:02:00,968][39733] Initialized w:6 v:3 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,969][39733] Initialized w:6 v:3 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,969][39733] Initialized w:6 v:3 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,970][39733] Initialized w:6 v:3 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,970][39733] Initialized w:6 v:3 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,971][39731] Using port 40703 on host...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,971][39733] Initialized w:6 v:3 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,971][39733] Initialized w:6 v:3 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,972][39733] Initialized w:6 v:3 player:0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:00,973][39733] 8 agent workers initialized for env 6!\u001b[0m\n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:02:00,984][39731] Initializing env for player 1, init_info: {'port': 40703}...\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI7 (node 0, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:00,999][39696] Initializing env for player 3, init_info: {'port': 40503}...\u001b[0m\n", - "Found AI7 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\n", - "Go \n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,016][39733] Decorrelating experience for 96 frames...\u001b[0m\n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,031][39685] Initialized w:0 v:3 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,033][39685] Initialized w:0 v:3 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,034][39685] Initialized w:0 v:3 player:5\u001b[0m\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,034][39685] Initialized w:0 v:3 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,035][39685] Initialized w:0 v:3 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,035][39685] Initialized w:0 v:3 player:0\u001b[0m\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,039][39685] Initialized w:0 v:3 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,042][39731] Initializing env for player 2, init_info: {'port': 40703}...\u001b[0m\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,051][39696] Initializing env for player 4, init_info: {'port': 40503}...\u001b[0m\n", - "\n", - "Exchanging game information.\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,095][39731] Initializing env for player 3, init_info: {'port': 40703}...\u001b[0m\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,129][39696] Initializing env for player 5, init_info: {'port': 40503}...\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,153][39698] Initialized w:3 v:3 player:6\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,157][39698] Initialized w:3 v:3 player:4\u001b[0m\n", - "Found AI6 (node 3, player 4) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI4 (node 2, player 3) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,159][39698] Initialized w:3 v:3 player:5\u001b[0m\n", - "Found AI3 (node 6, player 7) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,159][39698] Initialized w:3 v:3 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,159][39698] Initialized w:3 v:3 player:2\u001b[0m\n", - "Found AI5 (node 5, player 6) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,159][39698] Initialized w:3 v:3 player:0\u001b[0m\n", - "Found AI7 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,159][39698] Initialized w:3 v:3 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,160][39698] Initialized w:3 v:3 player:3\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:01,162][39698] 8 agent workers initialized for env 3!\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI6 (node 4, player 4) \n", - "Found AI2 (node 0, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,180][39731] Initializing env for player 4, init_info: {'port': 40703}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,183][39696] Initializing env for player 6, init_info: {'port': 40503}...\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI4 (node 2, player 3) \n", - "Found AI6 (node 3, player 4) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Found AI3 (node 2, player 3) work game synchronization.\n", - "Found AI2 (node 4, player 5) \n", - "Found AI6 (node 3, player 4) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "\n", - "Found AI5 (node 7, player 8) .\n", - "\n", - "Found AI1 (node 1, player 2) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 0, player 3) \n", - "Found AI6 (node 3, player 4) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI6 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI3 (node 0, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,233][39731] Initializing env for player 5, init_info: {'port': 40703}...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,236][39698] Decorrelating experience for 96 frames...\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI6 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI5 (node 6, player 6) \n", - "Found AI3 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI6 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI5 (node 0, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,251][39696] Initializing env for player 7, init_info: {'port': 40503}...\u001b[0m\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 0, player 3) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI6 (node 3, player 4) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI6 (node 4, player 4) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI2 (node 0, player 5) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI6 (node 0, player 4) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI4 (node 3, player 3) \n", - "Found AI5 (node 7, player 8) \n", - "Found AI6 (node 0, player 4) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI5 (node 5, player 6) \n", - "Found AI3 (node 6, player 7) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI6 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI4 (node 0, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI5 (node 7, player 8) \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI6 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI4 (node 6, player 6) \n", - "Found AI7 (node 0, player 7) \n", - "Found AI5 (node 7, player 8) \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI6 (node 4, player 4) \n", - "Found AI2 (node 5, player 5) \n", - "Found AI4 (node 6, player 6) \n", - "Found AI7 (node 7, player 7) \n", - "Found AI5 (node 0, player 8) \n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,303][39731] Initializing env for player 6, init_info: {'port': 40703}...\u001b[0m\n", - "Found AI1 (node 0, player 2) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI6 (node 3, player 4) \n", - "Found AI2 (node 4, player 5) \n", - "Found AI4 (node 5, player 6) \n", - "Found AI7 (node 6, player 7) \n", - "Found AI5 (node 7, player 8) \n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: -s: . [ 1/ 8]\n", - "\n", - "\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,369][39731] Initializing env for player 7, init_info: {'port': 40703}...\u001b[0m\n", - "\n", - "Got connect from node 1. \n", - "Got connect from node 2. \n", - "Waiting for players: ... [ 3/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /\u001b[37m\u001b[1m[2023-09-12 21:02:01,413][39697] Initialized w:1 v:3 player:3\u001b[0m\n", - "\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,415][39697] Initialized w:1 v:3 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,417][39697] Initialized w:1 v:3 player:0\u001b[0m\n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:02:01,417][39697] Initialized w:1 v:3 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,418][39697] Initialized w:1 v:3 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,420][39697] Initialized w:1 v:3 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,421][39697] Initialized w:1 v:3 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,422][39697] Initialized w:1 v:3 player:5\u001b[0m\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "\u001b[36m[2023-09-12 21:02:01,423][39697] 8 agent workers initialized for env 1!\u001b[0m\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for players: . [ 1/ 8]\u001b[37m\u001b[1m[2023-09-12 21:02:01,459][39699] Initialized w:5 v:3 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,461][39699] Initialized w:5 v:3 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,461][39699] Initialized w:5 v:3 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,462][39699] Initialized w:5 v:3 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,463][39699] Initialized w:5 v:3 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,466][39699] Initialized w:5 v:3 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,466][39699] Initialized w:5 v:3 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,466][39699] Initialized w:5 v:3 player:3\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:01,467][39699] 8 agent workers initialized for env 5!\u001b[0m\n", - "Got connect from node 3. \n", - "Waiting for players: .... [ 4/ 8]\u001b[37m\u001b[1m[2023-09-12 21:02:01,494][39697] Decorrelating experience for 96 frames...\u001b[0m\n", - "Contacting host: -Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 1. 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:01,540][39699] Decorrelating experience for 96 frames...\u001b[0m\n", - "Waiting for players: . [ 1/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: .... [ 4/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Got connect from node 1. 8]\n", - "Waiting for players: .. [ 2/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .. [ 2/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 6. \n", - "Waiting for players: ....... [ 7/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Contacting host: /Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Got connect from node 2. 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Got connect from node 7. 8]\n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Got connect from node 3. 8]\n", - "Got connect from node 4. \n", - "Got connect from node 5. \n", - "Got connect from node 6. \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Got connect from node 2. 8]\n", - "Got connect from node 3. \n", - "Got connect from node 4. \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ... [ 3/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: .... [ 4/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ..... [ 5/ 8]\n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,032][39685] Initialized w:0 v:3 player:2\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:02,033][39685] 8 agent workers initialized for env 0!\u001b[0m\n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Got connect from node 5. \n", - "Console player number: 3 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 7 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 4 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 5 8]\n", - "Received All Here, sending ACK. \n", - "Console player number: 6 ..... [ 8/ 8]\n", - "Received All Here, sending ACK. \n", - "Press 'Q' to abort network game synchronization.\n", - "Network game synchronization timeout: 4s.\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "Go \n", - "Total players: 8 \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:02:02,105][39685] Decorrelating experience for 96 frames...\u001b[0m\n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Go \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Total players: 8 \n", - "\n", - "Waiting for other players: ...... [ 6/ 8]\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Got connect from node 6. \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. 8]\n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Contacting host: -\n", - "Exchanging game information.\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ....... [ 7/ 8]\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Got connect from node 7. \n", - "Waiting for players: ........ [ 8/ 8]\n", - "Sending all here. \n", - "\n", - "Found AI0_host (node 1, player 1) \n", - "Total players: 8 8]\n", - "\n", - "Waiting for other players: ........ [ 8/ 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) 8]\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) 8]\n", - "Found AI2 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI6 (node 6, player 6) \n", - "Found AI5 (node 0, player 7) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 0, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI6 (node 0, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI4 (node 3, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI4 (node 7, player 8) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI1 (node 2, player 2) 8]\n", - "Found AI2 (node 3, player 3) \n", - "Found AI4 (node 0, player 4) \n", - "Found AI3 (node 4, player 5) \n", - "Found AI6 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 0, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI4 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Console player number: 1 \n", - "Received All Here, sending ACK. \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 0, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI4 (node 7, player 8) \n", - "Console player number: 2 \n", - "Received All Here, sending ACK. \n", - "Console player number: 7 \n", - "Received All Here, sending ACK. \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI4 (node 4, player 4) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 5, player 5) \n", - "Found AI6 (node 6, player 6) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI5 (node 7, player 7) \n", - "Found AI7 (node 0, player 8) \n", - "Found AI6 (node 0, player 5) \n", - "Console player number: 3 \n", - "Received All Here, sending ACK. \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI4 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI6 (node 5, player 5) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI7 (node 0, player 6) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 5, player 5) \n", - "Found AI4 (node 7, player 8) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 0, player 7) \n", - "Found AI4 (node 7, player 8) \n", - "\n", - "Found AI1 (node 2, player 2) \n", - "Found AI2 (node 3, player 3) \n", - "Found AI3 (node 4, player 4) \n", - "Found AI6 (node 5, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 7, player 7) \n", - "Found AI4 (node 0, player 8) \n", - "Console player number: 4 \n", - "Received All Here, sending ACK. \n", - "Console player number: 6 \n", - "Received All Here, sending ACK. \n", - "\n", - "\n", - "Found AI1 (node 0, player 2) \n", - "Found AI2 (node 2, player 3) \n", - "Found AI3 (node 3, player 4) \n", - "Found AI6 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI4 (node 7, player 8) \n", - "\n", - "\n", - "\n", - "\n", - "Console player number: 5 \n", - "Received All Here, sending ACK. \n", - "\n", - "\n", - "Go \n", - "Total players: 8 \n", - "\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,510][39734] Initialized w:7 v:3 player:2\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,511][39734] Initialized w:7 v:3 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,512][39734] Initialized w:7 v:3 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,512][39734] Initialized w:7 v:3 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,512][39734] Initialized w:7 v:3 player:1\u001b[0m\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,513][39734] Initialized w:7 v:3 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,513][39734] Initialized w:7 v:3 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,514][39734] Initialized w:7 v:3 player:6\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:02,515][39734] 8 agent workers initialized for env 7!\u001b[0m\n", - "\n", - "Exchanging game information.\n", - "Exchanging game information.\n", - "Received All Here, sending ACK. \n", - "Received \"Go.\" \n", - "\n", - "Total players: 8 \n", - "\n", - "Exchanging game information.\u001b[37m\u001b[1m[2023-09-12 21:02:02,555][39734] Decorrelating experience for 96 frames...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,559][39696] Initialized w:2 v:3 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,560][39696] Initialized w:2 v:3 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,560][39696] Initialized w:2 v:3 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,560][39696] Initialized w:2 v:3 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,560][39696] Initialized w:2 v:3 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,561][39696] Initialized w:2 v:3 player:0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,561][39696] Initialized w:2 v:3 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,561][39696] Initialized w:2 v:3 player:7\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:02,563][39696] 8 agent workers initialized for env 2!\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,612][39696] Decorrelating experience for 96 frames...\u001b[0m\n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI0_host (node 1, player 1) \n", - "Found AI1 (node 1, player 2) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI1 (node 0, player 2) \n", - "Found AI3 (node 2, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 0, player 3) \n", - "Found AI2 (node 3, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 7, player 7) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI6 (node 0, player 8) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 0, player 4) \n", - "Found AI4 (node 4, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 0, player 5) \n", - "Found AI7 (node 5, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI7 (node 6, player 6) \n", - "Found AI5 (node 0, player 7) \n", - "Found AI6 (node 7, player 8) \n", - "Found AI1 (node 2, player 2) \n", - "Found AI3 (node 3, player 3) \n", - "Found AI2 (node 4, player 4) \n", - "Found AI4 (node 5, player 5) \n", - "Found AI7 (node 0, player 6) \n", - "Found AI5 (node 6, player 7) \n", - "Found AI6 (node 7, player 8) \n", + "Waiting for other players: .. [ 2/ 2]\n", + "Console player number: 1 \n", + "Received All Here, sending ACK. \n", "\n", + "Go \n", + "Total players: 2 \n", "\n", + "Console player number: 1 \n", + "Received All Here, sending ACK. \n", + "Received \"Go.\" \n", "\n", + "Total players: 2 \n", "\n", + "Found AI0_host (node 1, player 1) \n", + "Found AI1 (node 1, player 2) \n", + "Found AI1 (node 0, player 2) \n", "\n", "\n", - "\n", - "\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,881][39731] Initialized w:4 v:3 player:3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,883][39731] Initialized w:4 v:3 player:1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,883][39731] Initialized w:4 v:3 player:6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,883][39731] Initialized w:4 v:3 player:5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,883][39731] Initialized w:4 v:3 player:2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,883][39731] Initialized w:4 v:3 player:7\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,884][39731] Initialized w:4 v:3 player:4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,884][39731] Initialized w:4 v:3 player:0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:02,887][39731] 8 agent workers initialized for env 4!\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:02,948][39731] Decorrelating experience for 96 frames...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:03,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:05,178][39537] Signal inference workers to stop experience collection...\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:05,203][39686] InferenceWorker_p0-w0: stopping experience collection\u001b[0m\n", - "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/torch/nn/modules/module.py:1501: UserWarning: operator() profile_node %43 : int[] = prim::profile_ivalue(%axis.1)\n", - " does not have profile information (Triggered internally at ../third_party/nvfuser/csrc/graph_fuser.cpp:104.)\n", - " return forward_call(*args, **kwargs)\n", - "\u001b[31m\u001b[1m[2023-09-12 21:02:06,207][39537] EvtLoop [learner_proc0_evt_loop, process=learner_proc0] unhandled exception in slot='on_new_training_batch' connected to emitter=Emitter(object_id='Batcher_0', signal_name='training_batches_available'), args=(0,)\u001b[0m\n", - "Traceback (most recent call last):\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py\", line 355, in _process_signal\n", - " slot_callable(*args)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner_worker.py\", line 150, in on_new_training_batch\n", - " stats = self.learner.train(self.batcher.training_batches[batch_idx])\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py\", line 1046, in train\n", - " train_stats = self._train(buff, self.cfg.batch_size, experience_size, num_invalids)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py\", line 731, in _train\n", - " ) = self._calculate_losses(mb, num_invalids)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py\", line 649, in _calculate_losses\n", - " exploration_loss = self.exploration_loss_func(action_distribution, valids, num_invalids)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py\", line 477, in _symmetric_kl_exploration_loss\n", - " kl_prior = action_distribution.symmetric_kl_with_uniform_prior()\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py\", line 247, in symmetric_kl_with_uniform_prior\n", - " sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions]\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py\", line 247, in \n", - " sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions]\n", - "AttributeError: 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior'\n", - "\u001b[33m[2023-09-12 21:02:06,208][39537] Unhandled exception 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior' in evt loop learner_proc0_evt_loop\u001b[0m\n", - "Process learner_proc0:\n", - "Traceback (most recent call last):\n", - " File \"/home/cogstack/miniconda3/lib/python3.10/multiprocessing/process.py\", line 314, in _bootstrap\n", - " self.run()\n", - " File \"/home/cogstack/miniconda3/lib/python3.10/multiprocessing/process.py\", line 108, in run\n", - " self._target(*self._args, **self._kwargs)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py\", line 511, in _target\n", - " self.event_loop.exec()\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py\", line 403, in exec\n", - " raise exc\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py\", line 399, in exec\n", - " while self._loop_iteration():\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py\", line 383, in _loop_iteration\n", - " self._process_signal(s)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py\", line 358, in _process_signal\n", - " raise exc\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py\", line 355, in _process_signal\n", - " slot_callable(*args)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner_worker.py\", line 150, in on_new_training_batch\n", - " stats = self.learner.train(self.batcher.training_batches[batch_idx])\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py\", line 1046, in train\n", - " train_stats = self._train(buff, self.cfg.batch_size, experience_size, num_invalids)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py\", line 731, in _train\n", - " ) = self._calculate_losses(mb, num_invalids)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py\", line 649, in _calculate_losses\n", - " exploration_loss = self.exploration_loss_func(action_distribution, valids, num_invalids)\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py\", line 477, in _symmetric_kl_exploration_loss\n", - " kl_prior = action_distribution.symmetric_kl_with_uniform_prior()\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py\", line 247, in symmetric_kl_with_uniform_prior\n", - " sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions]\n", - " File \"/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py\", line 247, in \n", - " sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions]\n", - "AttributeError: 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior'\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,931][28625] Heartbeat connected on Batcher_0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,938][28625] Heartbeat connected on InferenceWorker_p0-w0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,944][28625] Heartbeat connected on RolloutWorker_w0\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,949][28625] Heartbeat connected on RolloutWorker_w1\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,953][28625] Heartbeat connected on RolloutWorker_w2\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,957][28625] Heartbeat connected on RolloutWorker_w3\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,961][28625] Heartbeat connected on RolloutWorker_w4\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,965][28625] Heartbeat connected on RolloutWorker_w5\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,968][28625] Heartbeat connected on RolloutWorker_w6\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:02:06,973][28625] Heartbeat connected on RolloutWorker_w7\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 483.2. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 362.4. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 289.9. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 241.6. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 207.1. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 181.2. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 161.1. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 161.1. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 161.1. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:02:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:03:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:04:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:33,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:48,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:05:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:06:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:07:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:03,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:08,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:08:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:09:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:28,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:10:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:23,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:28,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:43,670][28625] Components not started: LearnerWorker_p0, wait_time=600.0 seconds\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:11:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:38,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:12:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:13:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:14:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:08,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:48,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:53,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:15:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:16:58,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:03,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:17:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:08,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:23,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:28,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:18:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:13,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:18,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:33,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:19:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:08,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:33,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:43,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:20:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:43,670][28625] Components not started: LearnerWorker_p0, wait_time=1200.0 seconds\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:21:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:22:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:23:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:03,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:08,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:28,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:43,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:24:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:25:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:48,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:26:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:03,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:53,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:27:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:43,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:28:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:29:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:30:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:31:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:31:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:31:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:31:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:31:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0)\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:31:27,821][28625] Keyboard interrupt detected in the event loop EvtLoop [Runner_EvtLoop, process=main process 28625], exiting...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:31:27,823][28625] Runner profile tree view:\n", - "main_loop: 1780.8502\u001b[0m\n", - "\u001b[36m[2023-09-12 21:31:27,824][39537] Stopping Batcher_0...\u001b[0m\n", - "\u001b[37m\u001b[1m[2023-09-12 21:31:27,825][28625] Collected {0: 0}, FPS: 0.0\u001b[0m\n", - "\u001b[36m[2023-09-12 21:31:27,825][39537] Loop batcher_evt_loop terminating...\u001b[0m\n" - ] - } - ], - "source": [ - "## Start the training, this should take around 15 minutes\n", - "register_vizdoom_components()\n", - "\n", - "# The scenario we train on today is health gathering\n", - "# other scenarios include \"doom_basic\", \"doom_two_colors_easy\", \"doom_dm\", \"doom_dwango5\", \"doom_my_way_home\", \"doom_deadly_corridor\", \"doom_defend_the_center\", \"doom_defend_the_line\", \"predict_position\", \"take_cover\"\n", - "env = \"doom_dwango5\"\n", - "cfg = parse_vizdoom_cfg(\n", - " argv=[f\"--env={env}\", \"--num_workers=8\", \"--num_envs_per_worker=4\", \"--train_for_env_steps=1000000\"]\n", - ")\n", - "\n", - "status = run_rl(cfg)" - ] - }, - { - "cell_type": "code", - "execution_count": 5, - "metadata": {}, - "outputs": [ - { - "name": "stderr", - "output_type": "stream", - "text": [ - "\u001b[33m[2023-09-12 21:01:01,865][28625] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,866][28625] Overriding arg 'num_workers' with value 1 passed from command line\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,867][28625] Adding new argument 'no_render'=True that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,869][28625] Adding new argument 'save_video'=True that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,870][28625] Adding new argument 'video_frames'=1000000000.0 that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,872][28625] Adding new argument 'video_name'=None that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,873][28625] Adding new argument 'max_num_frames'=1000000000.0 that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,875][28625] Adding new argument 'max_num_episodes'=10 that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,876][28625] Adding new argument 'push_to_hub'=False that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,877][28625] Adding new argument 'hf_repository'=None that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,877][28625] Adding new argument 'policy_index'=0 that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,878][28625] Adding new argument 'eval_deterministic'=False that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,879][28625] Adding new argument 'train_script'=None that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,879][28625] Adding new argument 'enjoy_script'=None that is not in the saved config file!\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,880][28625] Using frameskip 1 and render_action_repeat=4 for evaluation\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,881][28625] Multi agent env, num agents: 8\u001b[0m\n", - "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.num_agents to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.num_agents` for environment variables or `env.get_wrapper_attr('num_agents')` that will search the reminding wrappers.\u001b[0m\n", - " logger.warn(\n", - "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/gymnasium/core.py:311: UserWarning: \u001b[33mWARN: env.is_multiagent to get variables from other wrappers is deprecated and will be removed in v1.0, to get this variable you can do `env.unwrapped.is_multiagent` for environment variables or `env.get_wrapper_attr('is_multiagent')` that will search the reminding wrappers.\u001b[0m\n", - " logger.warn(\n", - "\u001b[36m[2023-09-12 21:01:01,913][28625] RunningMeanStd input shape: (23,)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,914][28625] RunningMeanStd input shape: (3, 72, 128)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,915][28625] RunningMeanStd input shape: (1,)\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,927][28625] ConvEncoder: input_channels=3\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,971][28625] Conv encoder output size: 512\u001b[0m\n", - "\u001b[36m[2023-09-12 21:01:01,974][28625] Policy head output size: 640\u001b[0m\n", - "\u001b[33m[2023-09-12 21:01:02,005][28625] No checkpoints found\u001b[0m\n" + "\u001b[37m\u001b[1m[2023-09-14 12:03:18,724][97397] Initialized w:0 v:0 player:0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:03:18,725][97397] Initialized w:0 v:0 player:1\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:19,234][97397] Num frames 100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:19,470][97397] Num frames 200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:19,714][97397] Num frames 300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:19,959][97397] Num frames 400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:20,180][97397] Num frames 500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:20,428][97397] Num frames 600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:20,660][97397] Num frames 700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:20,937][97397] Num frames 800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:21,231][97397] Num frames 900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:21,512][97397] Num frames 1000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:21,784][97397] Num frames 1100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:22,030][97397] Num frames 1200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:22,268][97397] Num frames 1300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:22,512][97397] Num frames 1400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:22,757][97397] Num frames 1500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:22,995][97397] Num frames 1600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:23,221][97397] Num frames 1700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:23,437][97397] Num frames 1800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:23,659][97397] Num frames 1900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:23,896][97397] Num frames 2000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:24,135][97397] Num frames 2100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:24,426][97397] Num frames 2200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:24,679][97397] Num frames 2300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:24,943][97397] Num frames 2400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:25,201][97397] Num frames 2500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:25,501][97397] Num frames 2600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:25,739][97397] Num frames 2700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:25,997][97397] Num frames 2800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:26,227][97397] Num frames 2900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:26,464][97397] Num frames 3000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:26,699][97397] Num frames 3100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:26,942][97397] Num frames 3200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:27,198][97397] Num frames 3300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:27,465][97397] Num frames 3400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:27,710][97397] Num frames 3500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:27,951][97397] Num frames 3600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:28,225][97397] Num frames 3700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:28,516][97397] Num frames 3800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:28,765][97397] Num frames 3900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:29,034][97397] Num frames 4000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:29,303][97397] Num frames 4100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:29,566][97397] Num frames 4200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:29,808][97397] Num frames 4300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:30,057][97397] Num frames 4400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:30,295][97397] Num frames 4500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:30,535][97397] Num frames 4600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:30,782][97397] Num frames 4700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:31,013][97397] Num frames 4800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:31,286][97397] Num frames 4900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:31,539][97397] Num frames 5000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:31,791][97397] Num frames 5100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:32,037][97397] Num frames 5200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:32,298][97397] Num frames 5300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:32,537][97397] Num frames 5400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:32,805][97397] Num frames 5500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:33,061][97397] Num frames 5600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:33,340][97397] Num frames 5700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:33,586][97397] Num frames 5800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:33,817][97397] Num frames 5900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:34,076][97397] Num frames 6000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:34,392][97397] Num frames 6100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:34,637][97397] Num frames 6200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:34,906][97397] Num frames 6300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:35,135][97397] Num frames 6400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:35,393][97397] Num frames 6500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:35,640][97397] Num frames 6600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:35,896][97397] Num frames 6700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:36,136][97397] Num frames 6800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:36,355][97397] Num frames 6900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:36,596][97397] Num frames 7000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:36,863][97397] Num frames 7100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:37,149][97397] Num frames 7200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:37,424][97397] Num frames 7300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:37,691][97397] Num frames 7400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:37,951][97397] Num frames 7500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:38,265][97397] Num frames 7600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:38,525][97397] Num frames 7700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:38,763][97397] Num frames 7800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:38,998][97397] Num frames 7900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:39,260][97397] Num frames 8000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:39,544][97397] Num frames 8100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:39,816][97397] Num frames 8200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:40,090][97397] Num frames 8300...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:03:40,347][97397] DAMAGECOUNT value on done: 0.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:03:40,347][97397] DAMAGECOUNT value on done: 12.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:03:40,349][97397] Sum rewards: 14.318, reward structure: {'HEALTH': '-1.120', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'AMMO5': '0.003', 'AMMO2': '0.014', 'AMMO3': '0.040', 'AMMO4': '0.069', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.400', 'weapon5': '0.574', 'weapon4': '0.602', 'weapon2': '1.536', 'weapon3': '13.002'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:03:40,416][97397] Avg episode rewards: #0: 10.216, #1: 14.318, true rewards: #0: 1.000, #1: 0.000\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:03:40,418][97397] Avg episode reward: 12.267, avg true_objective: 0.500\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:40,425][97397] Num frames 8400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:40,697][97397] Num frames 8500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:40,965][97397] Num frames 8600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:41,246][97397] Num frames 8700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:41,492][97397] Num frames 8800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:41,750][97397] Num frames 8900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:41,980][97397] Num frames 9000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:42,252][97397] Num frames 9100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:42,507][97397] Num frames 9200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:42,768][97397] Num frames 9300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:43,083][97397] Num frames 9400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:43,342][97397] Num frames 9500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:43,577][97397] Num frames 9600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:43,847][97397] Num frames 9700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:44,132][97397] Num frames 9800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:44,614][97397] Num frames 9900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:44,935][97397] Num frames 10000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:45,280][97397] Num frames 10100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:45,680][97397] Num frames 10200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:45,980][97397] Num frames 10300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:46,271][97397] Num frames 10400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:46,586][97397] Num frames 10500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:47,011][97397] Num frames 10600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:47,368][97397] Num frames 10700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:47,759][97397] Num frames 10800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:48,043][97397] Num frames 10900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:48,392][97397] Num frames 11000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:48,754][97397] Num frames 11100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:49,028][97397] Num frames 11200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:49,362][97397] Num frames 11300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:49,662][97397] Num frames 11400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:49,936][97397] Num frames 11500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:50,173][97397] Num frames 11600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:50,426][97397] Num frames 11700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:50,689][97397] Num frames 11800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:51,025][97397] Num frames 11900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:51,312][97397] Num frames 12000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:51,569][97397] Num frames 12100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:51,833][97397] Num frames 12200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:52,066][97397] Num frames 12300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:52,306][97397] Num frames 12400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:52,541][97397] Num frames 12500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:52,842][97397] Num frames 12600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:53,109][97397] Num frames 12700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:53,358][97397] Num frames 12800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:53,661][97397] Num frames 12900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:53,950][97397] Num frames 13000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:54,218][97397] Num frames 13100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:54,507][97397] Num frames 13200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:54,814][97397] Num frames 13300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:55,075][97397] Num frames 13400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:55,346][97397] Num frames 13500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:55,638][97397] Num frames 13600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:55,960][97397] Num frames 13700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:56,267][97397] Num frames 13800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:56,540][97397] Num frames 13900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:56,852][97397] Num frames 14000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:57,123][97397] Num frames 14100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:57,382][97397] Num frames 14200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:57,680][97397] Num frames 14300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:57,960][97397] Num frames 14400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:58,234][97397] Num frames 14500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:58,529][97397] Num frames 14600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:58,825][97397] Num frames 14700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:59,128][97397] Num frames 14800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:59,445][97397] Num frames 14900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:59,717][97397] Num frames 15000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:03:59,982][97397] Num frames 15100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:00,232][97397] Num frames 15200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:00,507][97397] Num frames 15300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:00,764][97397] Num frames 15400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:01,001][97397] Num frames 15500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:01,293][97397] Num frames 15600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:01,557][97397] Num frames 15700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:01,944][97397] Num frames 15800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:02,232][97397] Num frames 15900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:02,472][97397] Num frames 16000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:02,712][97397] Num frames 16100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:02,938][97397] Num frames 16200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:03,185][97397] Num frames 16300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:03,427][97397] Num frames 16400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:03,697][97397] Num frames 16500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:03,945][97397] Num frames 16600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:04,170][97397] Num frames 16700...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:04,458][97397] DAMAGECOUNT value on done: 45.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:04,458][97397] DAMAGECOUNT value on done: 37.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:04,460][97397] Sum rewards: 14.910, reward structure: {'HEALTH': '-1.100', 'DEATHCOUNT': '-1.000', 'FRAGCOUNT': '-0.001', 'HITCOUNT': '0.000', 'AMMO5': '0.007', 'AMMO2': '0.025', 'AMMO3': '0.040', 'AMMO4': '0.123', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.450', 'weapon5': '0.666', 'weapon2': '0.872', 'weapon4': '1.078', 'weapon3': '12.950'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:04,523][97397] Avg episode rewards: #0: 11.004, #1: 14.613, true rewards: #0: 1.000, #1: 0.000\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:04,524][97397] Avg episode reward: 12.809, avg true_objective: 0.500\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:04,537][97397] Num frames 16800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:04,881][97397] Num frames 16900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:05,221][97397] Num frames 17000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:05,516][97397] Num frames 17100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:05,777][97397] Num frames 17200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:06,013][97397] Num frames 17300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:06,260][97397] Num frames 17400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:06,504][97397] Num frames 17500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:06,754][97397] Num frames 17600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:07,073][97397] Num frames 17700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:07,350][97397] Num frames 17800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:07,602][97397] Num frames 17900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:07,903][97397] Num frames 18000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:08,237][97397] Num frames 18100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:08,546][97397] Num frames 18200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:08,776][97397] Num frames 18300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:09,022][97397] Num frames 18400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:09,275][97397] Num frames 18500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:09,543][97397] Num frames 18600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:09,797][97397] Num frames 18700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:10,062][97397] Num frames 18800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:10,307][97397] Num frames 18900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:10,568][97397] Num frames 19000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:10,864][97397] Num frames 19100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:11,098][97397] Num frames 19200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:11,396][97397] Num frames 19300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:11,632][97397] Num frames 19400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:11,889][97397] Num frames 19500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:12,112][97397] Num frames 19600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:12,361][97397] Num frames 19700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:12,616][97397] Num frames 19800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:12,868][97397] Num frames 19900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:13,164][97397] Num frames 20000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:13,401][97397] Num frames 20100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:13,650][97397] Num frames 20200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:13,878][97397] Num frames 20300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:14,130][97397] Num frames 20400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:14,401][97397] Num frames 20500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:14,646][97397] Num frames 20600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:14,916][97397] Num frames 20700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:15,199][97397] Num frames 20800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:15,466][97397] Num frames 20900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:15,720][97397] Num frames 21000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:15,953][97397] Num frames 21100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:16,210][97397] Num frames 21200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:16,473][97397] Num frames 21300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:16,712][97397] Num frames 21400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:16,936][97397] Num frames 21500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:17,181][97397] Num frames 21600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:17,431][97397] Num frames 21700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:17,711][97397] Num frames 21800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:17,973][97397] Num frames 21900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:18,290][97397] Num frames 22000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:18,536][97397] Num frames 22100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:18,792][97397] Num frames 22200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:19,032][97397] Num frames 22300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:19,304][97397] Num frames 22400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:19,551][97397] Num frames 22500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:19,780][97397] Num frames 22600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:20,016][97397] Num frames 22700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:20,259][97397] Num frames 22800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:20,493][97397] Num frames 22900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:20,774][97397] Num frames 23000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:21,015][97397] Num frames 23100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:21,284][97397] Num frames 23200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:21,520][97397] Num frames 23300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:21,777][97397] Num frames 23400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:22,013][97397] Num frames 23500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:22,246][97397] Num frames 23600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:22,481][97397] Num frames 23700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:22,716][97397] Num frames 23800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:22,938][97397] Num frames 23900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:23,165][97397] Num frames 24000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:23,417][97397] Num frames 24100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:23,651][97397] Num frames 24200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:23,888][97397] Num frames 24300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:24,136][97397] Num frames 24400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:24,426][97397] Num frames 24500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:24,698][97397] Num frames 24600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:24,977][97397] Num frames 24700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:25,257][97397] Num frames 24800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:25,561][97397] Num frames 24900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:25,820][97397] Num frames 25000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:26,061][97397] Num frames 25100...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:26,287][97397] DAMAGECOUNT value on done: 57.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:26,287][97397] DAMAGECOUNT value on done: 92.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:26,289][97397] Sum rewards: 9.675, reward structure: {'HEALTH': '-1.470', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO3': '0.020', 'AMMO4': '0.025', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon5': '0.194', 'WEAPON3': '0.200', 'DAMAGECOUNT': '0.200', 'FRAGCOUNT': '0.999', 'weapon4': '1.842', 'weapon3': '3.908', 'weapon2': '4.548'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:26,349][97397] Avg episode rewards: #0: 10.561, #1: 14.175, true rewards: #0: 0.667, #1: 0.000\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:26,350][97397] Avg episode reward: 12.368, avg true_objective: 0.333\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:26,366][97397] Num frames 25200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:26,632][97397] Num frames 25300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:26,901][97397] Num frames 25400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:27,185][97397] Num frames 25500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:27,438][97397] Num frames 25600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:27,679][97397] Num frames 25700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:27,927][97397] Num frames 25800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:28,205][97397] Num frames 25900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:28,498][97397] Num frames 26000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:28,782][97397] Num frames 26100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:29,072][97397] Num frames 26200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:29,342][97397] Num frames 26300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:29,583][97397] Num frames 26400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:29,847][97397] Num frames 26500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:30,142][97397] Num frames 26600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:30,414][97397] Num frames 26700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:30,661][97397] Num frames 26800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:30,920][97397] Num frames 26900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:31,202][97397] Num frames 27000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:31,434][97397] Num frames 27100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:31,674][97397] Num frames 27200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:31,932][97397] Num frames 27300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:32,167][97397] Num frames 27400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:32,386][97397] Num frames 27500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:32,608][97397] Num frames 27600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:32,825][97397] Num frames 27700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:33,072][97397] Num frames 27800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:33,312][97397] Num frames 27900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:33,547][97397] Num frames 28000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:33,792][97397] Num frames 28100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:34,030][97397] Num frames 28200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:34,284][97397] Num frames 28300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:34,553][97397] Num frames 28400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:34,800][97397] Num frames 28500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:35,057][97397] Num frames 28600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:35,314][97397] Num frames 28700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:35,562][97397] Num frames 28800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:35,795][97397] Num frames 28900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:36,036][97397] Num frames 29000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:36,266][97397] Num frames 29100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:36,503][97397] Num frames 29200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:36,746][97397] Num frames 29300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:36,998][97397] Num frames 29400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:37,247][97397] Num frames 29500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:37,505][97397] Num frames 29600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:37,756][97397] Num frames 29700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:38,028][97397] Num frames 29800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:38,291][97397] Num frames 29900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:38,536][97397] Num frames 30000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:38,793][97397] Num frames 30100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:39,048][97397] Num frames 30200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:39,301][97397] Num frames 30300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:39,549][97397] Num frames 30400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:39,782][97397] Num frames 30500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:40,014][97397] Num frames 30600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:40,252][97397] Num frames 30700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:40,496][97397] Num frames 30800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:40,722][97397] Num frames 30900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:40,973][97397] Num frames 31000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:41,282][97397] Num frames 31100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:41,538][97397] Num frames 31200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:41,780][97397] Num frames 31300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:42,016][97397] Num frames 31400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:42,248][97397] Num frames 31500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:42,486][97397] Num frames 31600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:42,725][97397] Num frames 31700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:42,998][97397] Num frames 31800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:43,261][97397] Num frames 31900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:43,498][97397] Num frames 32000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:43,801][97397] Num frames 32100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:44,104][97397] Num frames 32200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:44,403][97397] Num frames 32300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:44,690][97397] Num frames 32400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:44,949][97397] Num frames 32500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:45,237][97397] Num frames 32600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:45,499][97397] Num frames 32700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:45,739][97397] Num frames 32800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:45,990][97397] Num frames 32900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:46,252][97397] Num frames 33000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:46,510][97397] Num frames 33100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:46,742][97397] Num frames 33200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:47,033][97397] Num frames 33300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:47,284][97397] Num frames 33400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:47,556][97397] Num frames 33500...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:47,799][97397] DAMAGECOUNT value on done: 342.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:47,800][97397] DAMAGECOUNT value on done: 107.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:47,801][97397] Sum rewards: 19.276, reward structure: {'HEALTH': '-1.150', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO5': '0.008', 'AMMO2': '0.011', 'AMMO3': '0.040', 'AMMO4': '0.056', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.374', 'WEAPON3': '0.400', 'weapon4': '1.230', 'weapon2': '1.394', 'FRAGCOUNT': '1.999', 'DAMAGECOUNT': '2.850', 'weapon3': '12.764'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:47,863][97397] Avg episode rewards: #0: 12.740, #1: 12.316, true rewards: #0: 0.750, #1: 0.000\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:04:47,865][97397] Avg episode reward: 12.528, avg true_objective: 0.375\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:47,884][97397] Num frames 33600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:48,124][97397] Num frames 33700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:48,385][97397] Num frames 33800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:48,615][97397] Num frames 33900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:48,862][97397] Num frames 34000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:49,148][97397] Num frames 34100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:49,425][97397] Num frames 34200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:49,708][97397] Num frames 34300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:49,987][97397] Num frames 34400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:50,243][97397] Num frames 34500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:50,486][97397] Num frames 34600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:50,725][97397] Num frames 34700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:50,991][97397] Num frames 34800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:51,270][97397] Num frames 34900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:51,520][97397] Num frames 35000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:51,790][97397] Num frames 35100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:52,028][97397] Num frames 35200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:52,275][97397] Num frames 35300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:52,520][97397] Num frames 35400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:52,760][97397] Num frames 35500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:52,998][97397] Num frames 35600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:53,236][97397] Num frames 35700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:53,470][97397] Num frames 35800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:53,703][97397] Num frames 35900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:53,944][97397] Num frames 36000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:54,174][97397] Num frames 36100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:54,436][97397] Num frames 36200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:54,682][97397] Num frames 36300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:54,947][97397] Num frames 36400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:55,210][97397] Num frames 36500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:55,472][97397] Num frames 36600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:55,704][97397] Num frames 36700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:55,952][97397] Num frames 36800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:56,178][97397] Num frames 36900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:56,405][97397] Num frames 37000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:56,635][97397] Num frames 37100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:56,856][97397] Num frames 37200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:57,121][97397] Num frames 37300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:57,391][97397] Num frames 37400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:57,621][97397] Num frames 37500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:57,859][97397] Num frames 37600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:58,130][97397] Num frames 37700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:58,382][97397] Num frames 37800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:58,604][97397] Num frames 37900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:58,870][97397] Num frames 38000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:59,131][97397] Num frames 38100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:59,383][97397] Num frames 38200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:59,626][97397] Num frames 38300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:04:59,862][97397] Num frames 38400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:00,101][97397] Num frames 38500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:00,343][97397] Num frames 38600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:00,567][97397] Num frames 38700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:00,801][97397] Num frames 38800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:01,050][97397] Num frames 38900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:01,337][97397] Num frames 39000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:01,608][97397] Num frames 39100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:01,865][97397] Num frames 39200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:02,116][97397] Num frames 39300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:02,357][97397] Num frames 39400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:02,605][97397] Num frames 39500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:02,832][97397] Num frames 39600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:03,081][97397] Num frames 39700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:03,342][97397] Num frames 39800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:03,623][97397] Num frames 39900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:03,923][97397] Num frames 40000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:04,190][97397] Num frames 40100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:04,551][97397] Num frames 40200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:04,831][97397] Num frames 40300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:05,082][97397] Num frames 40400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:05,341][97397] Num frames 40500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:05,629][97397] Num frames 40600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:05,874][97397] Num frames 40700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:06,146][97397] Num frames 40800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:06,386][97397] Num frames 40900...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:06,633][97397] Num frames 41000...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:06,869][97397] Num frames 41100...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:07,142][97397] Num frames 41200...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:07,416][97397] Num frames 41300...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:07,719][97397] Num frames 41400...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:07,962][97397] Num frames 41500...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:08,222][97397] Num frames 41600...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:08,472][97397] Num frames 41700...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:08,727][97397] Num frames 41800...\u001b[0m\n", + "\u001b[36m[2023-09-14 12:05:08,963][97397] Num frames 41900...\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:05:09,207][97397] DAMAGECOUNT value on done: 442.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:05:09,207][97397] DAMAGECOUNT value on done: 282.0\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:05:09,208][97397] Sum rewards: 12.061, reward structure: {'HEALTH': '-2.400', 'DEATHCOUNT': '-2.000', 'HITCOUNT': '0.000', 'AMMO5': '0.003', 'AMMO2': '0.004', 'AMMO4': '0.020', 'AMMO3': '0.050', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'WEAPON3': '0.400', 'weapon5': '0.556', 'FRAGCOUNT': '0.999', 'DAMAGECOUNT': '1.000', 'weapon4': '1.958', 'weapon2': '2.464', 'weapon3': '8.806'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:05:09,209][97397] Sum rewards: 11.181, reward structure: {'HEALTH': '-1.000', 'DEATHCOUNT': '-1.000', 'HITCOUNT': '0.000', 'AMMO2': '0.005', 'AMMO4': '0.025', 'AMMO3': '0.037', 'WEAPON4': '0.100', 'WEAPON3': '0.300', 'weapon4': '0.702', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.750', 'weapon2': '3.640', 'weapon3': '5.622'}\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:05:09,273][97397] Avg episode rewards: #0: 12.604, #1: 12.089, true rewards: #0: 0.600, #1: 0.200\u001b[0m\n", + "\u001b[37m\u001b[1m[2023-09-14 12:05:09,275][97397] Avg episode reward: 12.346, avg true_objective: 0.400\u001b[0m\n" ] }, { - "ename": "TypeError", - "evalue": "'NoneType' object is not subscriptable", + "ename": "", + "evalue": "", "output_type": "error", "traceback": [ - "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", - "\u001b[0;31mTypeError\u001b[0m Traceback (most recent call last)", - "Cell \u001b[0;32mIn[5], line 6\u001b[0m\n\u001b[1;32m 1\u001b[0m \u001b[38;5;28;01mfrom\u001b[39;00m \u001b[38;5;21;01msample_factory\u001b[39;00m\u001b[38;5;21;01m.\u001b[39;00m\u001b[38;5;21;01menjoy\u001b[39;00m \u001b[38;5;28;01mimport\u001b[39;00m enjoy\n\u001b[1;32m 3\u001b[0m cfg \u001b[38;5;241m=\u001b[39m parse_vizdoom_cfg(\n\u001b[1;32m 4\u001b[0m argv\u001b[38;5;241m=\u001b[39m[\u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m--env=\u001b[39m\u001b[38;5;132;01m{\u001b[39;00menv\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m\"\u001b[39m, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m--num_workers=1\u001b[39m\u001b[38;5;124m\"\u001b[39m, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m--save_video\u001b[39m\u001b[38;5;124m\"\u001b[39m, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m--no_render\u001b[39m\u001b[38;5;124m\"\u001b[39m, \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m--max_num_episodes=10\u001b[39m\u001b[38;5;124m\"\u001b[39m], evaluation\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mTrue\u001b[39;00m\n\u001b[1;32m 5\u001b[0m )\n\u001b[0;32m----> 6\u001b[0m status \u001b[38;5;241m=\u001b[39m \u001b[43menjoy\u001b[49m\u001b[43m(\u001b[49m\u001b[43mcfg\u001b[49m\u001b[43m)\u001b[49m\n", - "File \u001b[0;32m~/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/enjoy.py:125\u001b[0m, in \u001b[0;36menjoy\u001b[0;34m(cfg)\u001b[0m\n\u001b[1;32m 123\u001b[0m checkpoints \u001b[38;5;241m=\u001b[39m Learner\u001b[38;5;241m.\u001b[39mget_checkpoints(Learner\u001b[38;5;241m.\u001b[39mcheckpoint_dir(cfg, policy_id), \u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;132;01m{\u001b[39;00mname_prefix\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m_*\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n\u001b[1;32m 124\u001b[0m checkpoint_dict \u001b[38;5;241m=\u001b[39m Learner\u001b[38;5;241m.\u001b[39mload_checkpoint(checkpoints, device)\n\u001b[0;32m--> 125\u001b[0m actor_critic\u001b[38;5;241m.\u001b[39mload_state_dict(\u001b[43mcheckpoint_dict\u001b[49m\u001b[43m[\u001b[49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[38;5;124;43mmodel\u001b[39;49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[43m]\u001b[49m)\n\u001b[1;32m 127\u001b[0m episode_rewards \u001b[38;5;241m=\u001b[39m [deque([], maxlen\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m100\u001b[39m) \u001b[38;5;28;01mfor\u001b[39;00m _ \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28mrange\u001b[39m(env\u001b[38;5;241m.\u001b[39mnum_agents)]\n\u001b[1;32m 128\u001b[0m true_objectives \u001b[38;5;241m=\u001b[39m [deque([], maxlen\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m100\u001b[39m) \u001b[38;5;28;01mfor\u001b[39;00m _ \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28mrange\u001b[39m(env\u001b[38;5;241m.\u001b[39mnum_agents)]\n", - "\u001b[0;31mTypeError\u001b[0m: 'NoneType' object is not subscriptable" + "\u001b[1;31mThe Kernel crashed while executing code in the the current cell or a previous cell. Please review the code in the cell(s) to identify a possible cause of the failure. Click here for more info. View Jupyter log for further details." ] } ], @@ -7106,9 +7449,24 @@ }, { "cell_type": "code", - "execution_count": null, + "execution_count": 1, "metadata": {}, - "outputs": [], + "outputs": [ + { + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "8e0e4af164c84f76a7d7ed1ec726fc6b", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "VBox(children=(HTML(value='
#0:0 (mpeg4 (native) -> h264 (libx264))\n", + "Press [q] to stop, [?] for help\n", + "[libx264 @ 0x562daca499c0] using SAR=1/1\n", + "[libx264 @ 0x562daca499c0] using cpu capabilities: MMX2 SSE2Fast SSSE3 SSE4.2 AVX FMA3 BMI2 AVX2 AVX512\n", + "[libx264 @ 0x562daca499c0] profile High, level 1.3\n", + "[libx264 @ 0x562daca499c0] 264 - core 155 r2917 0a84d98 - H.264/MPEG-4 AVC codec - Copyleft 2003-2018 - http://www.videolan.org/x264.html - options: cabac=1 ref=3 deblock=1:0:0 analyse=0x3:0x113 me=hex subme=7 psy=1 psy_rd=1.00:0.00 mixed_ref=1 me_range=16 chroma_me=1 trellis=1 8x8dct=1 cqm=0 deadzone=21,11 fast_pskip=1 chroma_qp_offset=-2 threads=6 lookahead_threads=1 sliced_threads=0 nr=0 decimate=1 interlaced=0 bluray_compat=0 constrained_intra=0 bframes=3 b_pyramid=2 b_adapt=1 b_bias=0 direct=1 weightb=1 open_gop=0 weightp=2 keyint=250 keyint_min=25 scenecut=40 intra_refresh=0 rc_lookahead=40 rc=crf mbtree=1 crf=23.0 qcomp=0.60 qpmin=0 qpmax=69 qpstep=4 ip_ratio=1.40 aq=1:1.00\n", + "Output #0, mp4, to '/home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/replay.mp4':\n", + " Metadata:\n", + " major_brand : isom\n", + " minor_version : 512\n", + " compatible_brands: isomiso2mp41\n", + " encoder : Lavf58.29.100\n", + " Stream #0:0(und): Video: h264 (libx264) (avc1 / 0x31637661), yuv420p, 240x180 [SAR 1:1 DAR 4:3], q=-1--1, 35 fps, 17920 tbn, 35 tbc (default)\n", + " Metadata:\n", + " handler_name : VideoHandler\n", + " encoder : Lavc58.54.100 libx264\n", + " Side data:\n", + " cpb: bitrate max/min/avg: 0/0/0 buffer size: 0 vbv_delay: -1\n", + "frame=84002 fps=612 q=-1.0 Lsize= 143428kB time=00:39:59.97 bitrate= 489.6kbits/s speed=17.5x \n", + "video:142456kB audio:0kB subtitle:0kB other streams:0kB global headers:0kB muxing overhead: 0.682432%\n", + "[libx264 @ 0x562daca499c0] frame I:378 Avg QP:24.35 size: 8685\n", + "[libx264 @ 0x562daca499c0] frame P:23342 Avg QP:27.69 size: 2340\n", + "[libx264 @ 0x562daca499c0] frame B:60282 Avg QP:29.86 size: 1459\n", + "[libx264 @ 0x562daca499c0] consecutive B-frames: 3.3% 1.9% 3.6% 91.2%\n", + "[libx264 @ 0x562daca499c0] mb I I16..4: 0.7% 65.6% 33.7%\n", + "[libx264 @ 0x562daca499c0] mb P I16..4: 1.1% 24.0% 5.0% P16..4: 28.4% 16.4% 6.6% 0.0% 0.0% skip:18.5%\n", + "[libx264 @ 0x562daca499c0] mb B I16..4: 0.3% 6.1% 0.8% B16..8: 39.8% 15.1% 4.0% direct: 6.2% skip:27.6% L0:49.8% L1:44.3% BI: 5.9%\n", + "[libx264 @ 0x562daca499c0] 8x8 transform intra:81.1% inter:68.6%\n", + "[libx264 @ 0x562daca499c0] coded y,uvDC,uvAC intra: 89.6% 59.3% 24.3% inter: 42.0% 15.8% 2.6%\n", + "[libx264 @ 0x562daca499c0] i16 v,h,dc,p: 58% 25% 9% 9%\n", + "[libx264 @ 0x562daca499c0] i8 v,h,dc,ddl,ddr,vr,hd,vl,hu: 14% 14% 39% 5% 5% 4% 6% 5% 8%\n", + "[libx264 @ 0x562daca499c0] i4 v,h,dc,ddl,ddr,vr,hd,vl,hu: 27% 21% 17% 6% 6% 5% 7% 5% 6%\n", + "[libx264 @ 0x562daca499c0] i8c dc,h,v,p: 64% 18% 16% 2%\n", + "[libx264 @ 0x562daca499c0] Weighted P-Frames: Y:0.1% UV:0.0%\n", + "[libx264 @ 0x562daca499c0] ref P L0: 49.0% 14.5% 22.4% 14.1% 0.0%\n", + "[libx264 @ 0x562daca499c0] ref B L0: 83.2% 12.7% 4.1%\n", + "[libx264 @ 0x562daca499c0] ref B L1: 93.9% 6.1%\n", + "[libx264 @ 0x562daca499c0] kb/s:486.24\n", + "\u001b[36m[2023-09-14 15:13:58,203][109198] Replay video saved to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/replay.mp4!\u001b[0m\n" ] }, { - "ename": "TypeError", - "evalue": "'NoneType' object is not subscriptable", - "output_type": "error", - "traceback": [ - "\u001b[0;31m---------------------------------------------------------------------------\u001b[0m", - "\u001b[0;31mTypeError\u001b[0m Traceback (most recent call last)", - "Cell \u001b[0;32mIn[8], line 18\u001b[0m\n\u001b[1;32m 3\u001b[0m hf_username \u001b[38;5;241m=\u001b[39m \u001b[38;5;124m\"\u001b[39m\u001b[38;5;124mMattStammers\u001b[39m\u001b[38;5;124m\"\u001b[39m \u001b[38;5;66;03m# insert your HuggingFace username here\u001b[39;00m\n\u001b[1;32m 5\u001b[0m cfg \u001b[38;5;241m=\u001b[39m parse_vizdoom_cfg(\n\u001b[1;32m 6\u001b[0m argv\u001b[38;5;241m=\u001b[39m[\n\u001b[1;32m 7\u001b[0m \u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;124m--env=\u001b[39m\u001b[38;5;132;01m{\u001b[39;00menv\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m\"\u001b[39m,\n\u001b[0;32m (...)\u001b[0m\n\u001b[1;32m 16\u001b[0m evaluation\u001b[38;5;241m=\u001b[39m\u001b[38;5;28;01mTrue\u001b[39;00m,\n\u001b[1;32m 17\u001b[0m )\n\u001b[0;32m---> 18\u001b[0m status \u001b[38;5;241m=\u001b[39m \u001b[43menjoy\u001b[49m\u001b[43m(\u001b[49m\u001b[43mcfg\u001b[49m\u001b[43m)\u001b[49m\n", - "File \u001b[0;32m~/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/enjoy.py:125\u001b[0m, in \u001b[0;36menjoy\u001b[0;34m(cfg)\u001b[0m\n\u001b[1;32m 123\u001b[0m checkpoints \u001b[38;5;241m=\u001b[39m Learner\u001b[38;5;241m.\u001b[39mget_checkpoints(Learner\u001b[38;5;241m.\u001b[39mcheckpoint_dir(cfg, policy_id), \u001b[38;5;124mf\u001b[39m\u001b[38;5;124m\"\u001b[39m\u001b[38;5;132;01m{\u001b[39;00mname_prefix\u001b[38;5;132;01m}\u001b[39;00m\u001b[38;5;124m_*\u001b[39m\u001b[38;5;124m\"\u001b[39m)\n\u001b[1;32m 124\u001b[0m checkpoint_dict \u001b[38;5;241m=\u001b[39m Learner\u001b[38;5;241m.\u001b[39mload_checkpoint(checkpoints, device)\n\u001b[0;32m--> 125\u001b[0m actor_critic\u001b[38;5;241m.\u001b[39mload_state_dict(\u001b[43mcheckpoint_dict\u001b[49m\u001b[43m[\u001b[49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[38;5;124;43mmodel\u001b[39;49m\u001b[38;5;124;43m\"\u001b[39;49m\u001b[43m]\u001b[49m)\n\u001b[1;32m 127\u001b[0m episode_rewards \u001b[38;5;241m=\u001b[39m [deque([], maxlen\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m100\u001b[39m) \u001b[38;5;28;01mfor\u001b[39;00m _ \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28mrange\u001b[39m(env\u001b[38;5;241m.\u001b[39mnum_agents)]\n\u001b[1;32m 128\u001b[0m true_objectives \u001b[38;5;241m=\u001b[39m [deque([], maxlen\u001b[38;5;241m=\u001b[39m\u001b[38;5;241m100\u001b[39m) \u001b[38;5;28;01mfor\u001b[39;00m _ \u001b[38;5;129;01min\u001b[39;00m \u001b[38;5;28mrange\u001b[39m(env\u001b[38;5;241m.\u001b[39mnum_agents)]\n", - "\u001b[0;31mTypeError\u001b[0m: 'NoneType' object is not subscriptable" - ] + "data": { + "application/vnd.jupyter.widget-view+json": { + "model_id": "25b118b82e0a48e7983fd116fc6b05ea", + "version_major": 2, + "version_minor": 0 + }, + "text/plain": [ + "checkpoint_000002343_9596928.pth: 0%| | 0.00/37.7M [00:00 --algo=APPO --env=doom_health_gathering_supreme --train_dir=./train_dir --experiment=rl_course_vizdoom_health_gathering_supreme --``` -- -- --You can also upload models to the Hugging Face Hub using the same script with the `--push_to_hub` flag. --See https://www.samplefactory.dev/10-huggingface/huggingface/ for more details -- --## Training with this model -- --To continue training with this model, use the `train` script corresponding to this environment: --``` --python -m --algo=APPO --env=doom_health_gathering_supreme --train_dir=./train_dir --experiment=rl_course_vizdoom_health_gathering_supreme --restart_behavior=resume --train_for_env_steps=10000000000 --``` -- --Note, you may have to adjust `--train_for_env_steps` to a su \ No newline at end of file diff --git a/environments/sample_factory/train_dir/default_experiment/sf_log.txt b/environments/sample_factory/train_dir/default_experiment/sf_log.txt index 4a0823e..4f05227 100644 --- a/environments/sample_factory/train_dir/default_experiment/sf_log.txt +++ b/environments/sample_factory/train_dir/default_experiment/sf_log.txt @@ -1,40 +1,17 @@ -[2023-09-12 18:21:38,856][129210] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json... -[2023-09-12 18:21:39,863][129210] Rollout worker 0 uses device cpu -[2023-09-12 18:21:39,865][129210] Rollout worker 1 uses device cpu -[2023-09-12 18:21:39,866][129210] Rollout worker 2 uses device cpu -[2023-09-12 18:21:39,867][129210] Rollout worker 3 uses device cpu -[2023-09-12 18:21:39,869][129210] Rollout worker 4 uses device cpu -[2023-09-12 18:21:39,871][129210] Rollout worker 5 uses device cpu -[2023-09-12 18:21:39,872][129210] Rollout worker 6 uses device cpu -[2023-09-12 18:21:39,874][129210] Rollout worker 7 uses device cpu -[2023-09-12 18:21:40,076][129210] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 18:21:40,077][129210] InferenceWorker_p0-w0: min num requests: 2 -[2023-09-12 18:21:40,103][129210] Starting all processes... -[2023-09-12 18:21:40,104][129210] Starting process learner_proc0 -[2023-09-12 18:21:41,823][129907] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 18:21:41,823][129907] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 -[2023-09-12 18:21:41,822][129210] Starting all processes... -[2023-09-12 18:21:41,829][129210] Starting process inference_proc0-0 -[2023-09-12 18:21:41,830][129210] Starting process rollout_proc0 -[2023-09-12 18:21:41,831][129210] Starting process rollout_proc1 -[2023-09-12 18:21:41,831][129210] Starting process rollout_proc2 -[2023-09-12 18:21:41,835][129210] Starting process rollout_proc3 -[2023-09-12 18:21:41,835][129210] Starting process rollout_proc4 -[2023-09-12 18:21:41,862][129907] Num visible devices: 1 -[2023-09-12 18:21:41,904][129907] Starting seed is not provided -[2023-09-12 18:21:41,904][129907] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 18:21:41,904][129907] Initializing actor-critic model on device cuda:0 -[2023-09-12 18:21:41,905][129907] RunningMeanStd input shape: (23,) -[2023-09-12 18:21:41,905][129907] RunningMeanStd input shape: (3, 72, 128) -[2023-09-12 18:21:41,905][129907] RunningMeanStd input shape: (1,) -[2023-09-12 18:21:41,836][129210] Starting process rollout_proc5 -[2023-09-12 18:21:41,836][129210] Starting process rollout_proc6 -[2023-09-12 18:21:41,918][129907] ConvEncoder: input_channels=3 -[2023-09-12 18:21:41,837][129210] Starting process rollout_proc7 -[2023-09-12 18:21:42,076][129907] Conv encoder output size: 512 -[2023-09-12 18:21:42,077][129907] Policy head output size: 640 -[2023-09-12 18:21:42,094][129907] Created Actor Critic model with architecture: -[2023-09-12 18:21:42,094][129907] ActorCriticSharedWeights( +[2023-09-14 14:36:31,459][63454] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 14:36:31,459][63454] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 +[2023-09-14 14:36:31,477][63454] Num visible devices: 1 +[2023-09-14 14:36:31,496][63454] Starting seed is not provided +[2023-09-14 14:36:31,496][63454] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 14:36:31,497][63454] Initializing actor-critic model on device cuda:0 +[2023-09-14 14:36:31,497][63454] RunningMeanStd input shape: (23,) +[2023-09-14 14:36:31,497][63454] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 14:36:31,498][63454] RunningMeanStd input shape: (1,) +[2023-09-14 14:36:31,509][63454] ConvEncoder: input_channels=3 +[2023-09-14 14:36:31,620][63454] Conv encoder output size: 512 +[2023-09-14 14:36:31,622][63454] Policy head output size: 640 +[2023-09-14 14:36:31,639][63454] Created Actor Critic model with architecture: +[2023-09-14 14:36:31,639][63454] ActorCriticSharedWeights( (obs_normalizer): ObservationNormalizer( (running_mean_std): RunningMeanStdDictInPlace( (running_mean_std): ModuleDict( @@ -79,1065 +56,29 @@ ) (critic_linear): Linear(in_features=512, out_features=1, bias=True) (action_parameterization): ActionParameterizationDefault( - (distribution_linear): Linear(in_features=512, out_features=15, bias=True) + (distribution_linear): Linear(in_features=512, out_features=39, bias=True) ) ) -[2023-09-12 18:21:43,441][129907] Using optimizer -[2023-09-12 18:21:43,441][129907] No checkpoints found -[2023-09-12 18:21:43,441][129907] Did not load from checkpoint, starting from scratch! -[2023-09-12 18:21:43,442][129907] Initialized policy 0 weights for model version 0 -[2023-09-12 18:21:43,443][129907] LearnerWorker_p0 finished initialization! -[2023-09-12 18:21:43,444][129907] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 18:21:43,873][130109] Worker 4 uses CPU cores [16, 17, 18, 19] -[2023-09-12 18:21:43,874][130072] Worker 0 uses CPU cores [0, 1, 2, 3] -[2023-09-12 18:21:43,942][130142] Worker 6 uses CPU cores [24, 25, 26, 27] -[2023-09-12 18:21:43,964][130071] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 18:21:43,964][130071] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 -[2023-09-12 18:21:43,983][130071] Num visible devices: 1 -[2023-09-12 18:21:44,025][130106] Worker 1 uses CPU cores [4, 5, 6, 7] -[2023-09-12 18:21:44,079][130107] Worker 2 uses CPU cores [8, 9, 10, 11] -[2023-09-12 18:21:44,103][130108] Worker 5 uses CPU cores [20, 21, 22, 23] -[2023-09-12 18:21:44,167][130141] Worker 3 uses CPU cores [12, 13, 14, 15] -[2023-09-12 18:21:44,172][130143] Worker 7 uses CPU cores [28, 29, 30, 31] -[2023-09-12 18:21:44,655][129210] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 0. Throughput: 0: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:21:44,657][130071] RunningMeanStd input shape: (23,) -[2023-09-12 18:21:44,658][130071] RunningMeanStd input shape: (3, 72, 128) -[2023-09-12 18:21:44,658][130071] RunningMeanStd input shape: (1,) -[2023-09-12 18:21:44,671][130071] ConvEncoder: input_channels=3 -[2023-09-12 18:21:44,779][130071] Conv encoder output size: 512 -[2023-09-12 18:21:44,780][130071] Policy head output size: 640 -[2023-09-12 18:21:45,128][129210] Inference worker 0-0 is ready! -[2023-09-12 18:21:45,129][129210] All inference workers are ready! Signal rollout workers to start! -[2023-09-12 18:21:45,133][130106] Multi agent env, num agents: 8 -[2023-09-12 18:21:45,135][130108] Multi agent env, num agents: 8 -[2023-09-12 18:21:45,135][130107] Multi agent env, num agents: 8 -[2023-09-12 18:21:45,135][130072] Multi agent env, num agents: 8 -[2023-09-12 18:21:45,136][130109] Multi agent env, num agents: 8 -[2023-09-12 18:21:45,136][130142] Multi agent env, num agents: 8 -[2023-09-12 18:21:45,137][130141] Multi agent env, num agents: 8 -[2023-09-12 18:21:45,137][130143] Multi agent env, num agents: 8 -[2023-09-12 18:21:45,169][130108] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 18:21:45,170][130072] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 18:21:45,170][130109] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 18:21:45,170][130107] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 18:21:45,172][130108] Multi agent env, num agents: 8 -[2023-09-12 18:21:45,173][130072] Multi agent env, num agents: 8 -[2023-09-12 18:21:45,173][130109] Multi agent env, num agents: 8 -[2023-09-12 18:21:45,173][130107] Multi agent env, num agents: 8 -[2023-09-12 18:21:45,177][130106] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 18:21:45,181][130142] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 18:21:45,182][130106] Multi agent env, num agents: 8 -[2023-09-12 18:21:45,186][130142] Multi agent env, num agents: 8 -[2023-09-12 18:21:45,189][130143] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 18:21:45,189][130141] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 18:21:45,194][130141] Multi agent env, num agents: 8 -[2023-09-12 18:21:45,194][130143] Multi agent env, num agents: 8 -[2023-09-12 18:21:45,203][130108] Port 40800 is available -[2023-09-12 18:21:45,204][130108] Using port 40800 -[2023-09-12 18:21:45,205][130109] Port 40700 is available -[2023-09-12 18:21:45,205][130109] Using port 40700 -[2023-09-12 18:21:45,205][130108] Initializing env for player 0, init_info: {'port': 40800}... -[2023-09-12 18:21:45,205][130072] Port 40300 is available -[2023-09-12 18:21:45,205][130072] Using port 40300 -[2023-09-12 18:21:45,206][130109] Initializing env for player 0, init_info: {'port': 40700}... -[2023-09-12 18:21:45,207][130072] Initializing env for player 0, init_info: {'port': 40300}... -[2023-09-12 18:21:45,208][130107] Port 40500 is available -[2023-09-12 18:21:45,208][130107] Using port 40500 -[2023-09-12 18:21:45,209][130107] Initializing env for player 0, init_info: {'port': 40500}... -[2023-09-12 18:21:45,220][130142] Port 40900 is available -[2023-09-12 18:21:45,220][130142] Using port 40900 -[2023-09-12 18:21:45,227][130106] Port 40400 is available -[2023-09-12 18:21:45,227][130106] Using port 40400 -[2023-09-12 18:21:45,228][130106] Initializing env for player 0, init_info: {'port': 40400}... -[2023-09-12 18:21:45,234][130108] Using port 40800 on host... -[2023-09-12 18:21:45,235][130072] Using port 40300 on host... -[2023-09-12 18:21:45,236][130109] Using port 40700 on host... -[2023-09-12 18:21:45,240][130143] Port 41000 is available -[2023-09-12 18:21:45,240][130143] Using port 41000 -[2023-09-12 18:21:45,241][130143] Initializing env for player 0, init_info: {'port': 41000}... -[2023-09-12 18:21:45,245][130107] Using port 40500 on host... -[2023-09-12 18:21:45,247][130141] Port 40600 is available -[2023-09-12 18:21:45,247][130141] Using port 40600 -[2023-09-12 18:21:45,248][130141] Initializing env for player 0, init_info: {'port': 40600}... -[2023-09-12 18:21:45,256][130108] Initializing env for player 1, init_info: {'port': 40800}... -[2023-09-12 18:21:45,256][130109] Initializing env for player 1, init_info: {'port': 40700}... -[2023-09-12 18:21:45,257][130072] Initializing env for player 1, init_info: {'port': 40300}... -[2023-09-12 18:21:45,260][130107] Initializing env for player 1, init_info: {'port': 40500}... -[2023-09-12 18:21:45,263][130106] Using port 40400 on host... -[2023-09-12 18:21:45,273][130143] Using port 41000 on host... -[2023-09-12 18:21:45,277][130141] Using port 40600 on host... -[2023-09-12 18:21:45,280][130106] Initializing env for player 1, init_info: {'port': 40400}... -[2023-09-12 18:21:45,291][130143] Initializing env for player 1, init_info: {'port': 41000}... -[2023-09-12 18:21:45,299][130141] Initializing env for player 1, init_info: {'port': 40600}... -[2023-09-12 18:21:45,306][130108] Initializing env for player 2, init_info: {'port': 40800}... -[2023-09-12 18:21:45,308][130072] Initializing env for player 2, init_info: {'port': 40300}... -[2023-09-12 18:21:45,309][130109] Initializing env for player 2, init_info: {'port': 40700}... -[2023-09-12 18:21:45,311][130107] Initializing env for player 2, init_info: {'port': 40500}... -[2023-09-12 18:21:45,333][130106] Initializing env for player 2, init_info: {'port': 40400}... -[2023-09-12 18:21:45,344][130143] Initializing env for player 2, init_info: {'port': 41000}... -[2023-09-12 18:21:45,349][130141] Initializing env for player 2, init_info: {'port': 40600}... -[2023-09-12 18:21:45,357][130108] Initializing env for player 3, init_info: {'port': 40800}... -[2023-09-12 18:21:45,358][130072] Initializing env for player 3, init_info: {'port': 40300}... -[2023-09-12 18:21:45,363][130107] Initializing env for player 3, init_info: {'port': 40500}... -[2023-09-12 18:21:45,366][130109] Initializing env for player 3, init_info: {'port': 40700}... -[2023-09-12 18:21:45,390][130106] Initializing env for player 3, init_info: {'port': 40400}... -[2023-09-12 18:21:45,401][130141] Initializing env for player 3, init_info: {'port': 40600}... -[2023-09-12 18:21:45,400][130143] Initializing env for player 3, init_info: {'port': 41000}... -[2023-09-12 18:21:45,416][130107] Initializing env for player 4, init_info: {'port': 40500}... -[2023-09-12 18:21:45,416][130109] Initializing env for player 4, init_info: {'port': 40700}... -[2023-09-12 18:21:45,421][130072] Initializing env for player 4, init_info: {'port': 40300}... -[2023-09-12 18:21:45,451][130143] Initializing env for player 4, init_info: {'port': 41000}... -[2023-09-12 18:21:45,461][130072] Initializing env for player 5, init_info: {'port': 40300}... -[2023-09-12 18:21:45,467][130109] Initializing env for player 5, init_info: {'port': 40700}... -[2023-09-12 18:21:45,467][130107] Initializing env for player 5, init_info: {'port': 40500}... -[2023-09-12 18:21:45,407][130108] Initializing env for player 4, init_info: {'port': 40800}... -[2023-09-12 18:21:45,471][130106] Initializing env for player 4, init_info: {'port': 40400}... -[2023-09-12 18:21:45,471][130141] Initializing env for player 4, init_info: {'port': 40600}... -[2023-09-12 18:21:45,471][130108] Initializing env for player 5, init_info: {'port': 40800}... -[2023-09-12 18:21:45,512][130072] Initializing env for player 6, init_info: {'port': 40300}... -[2023-09-12 18:21:45,507][130143] Initializing env for player 5, init_info: {'port': 41000}... -[2023-09-12 18:21:45,518][130109] Initializing env for player 6, init_info: {'port': 40700}... -[2023-09-12 18:21:45,521][130108] Initializing env for player 6, init_info: {'port': 40800}... -[2023-09-12 18:21:45,527][130141] Initializing env for player 5, init_info: {'port': 40600}... -[2023-09-12 18:21:45,539][130107] Initializing env for player 6, init_info: {'port': 40500}... -[2023-09-12 18:21:45,546][130106] Initializing env for player 5, init_info: {'port': 40400}... -[2023-09-12 18:21:45,556][130143] Initializing env for player 6, init_info: {'port': 41000}... -[2023-09-12 18:21:45,567][130072] Initializing env for player 7, init_info: {'port': 40300}... -[2023-09-12 18:21:45,571][130109] Initializing env for player 7, init_info: {'port': 40700}... -[2023-09-12 18:21:45,572][130108] Initializing env for player 7, init_info: {'port': 40800}... -[2023-09-12 18:21:45,580][130141] Initializing env for player 6, init_info: {'port': 40600}... -[2023-09-12 18:21:45,595][130106] Initializing env for player 6, init_info: {'port': 40400}... -[2023-09-12 18:21:45,595][130107] Initializing env for player 7, init_info: {'port': 40500}... -[2023-09-12 18:21:45,607][130143] Initializing env for player 7, init_info: {'port': 41000}... -[2023-09-12 18:21:45,627][130141] Initializing env for player 7, init_info: {'port': 40600}... -[2023-09-12 18:21:45,667][130106] Initializing env for player 7, init_info: {'port': 40400}... -[2023-09-12 18:21:46,929][130107] Initialized w:2 v:0 player:6 -[2023-09-12 18:21:46,930][130107] Initialized w:2 v:0 player:3 -[2023-09-12 18:21:46,931][130107] Initialized w:2 v:0 player:7 -[2023-09-12 18:21:46,930][130107] Initialized w:2 v:0 player:0 -[2023-09-12 18:21:46,931][130107] Initialized w:2 v:0 player:2 -[2023-09-12 18:21:46,931][130107] Initialized w:2 v:0 player:1 -[2023-09-12 18:21:46,932][130107] Initialized w:2 v:0 player:4 -[2023-09-12 18:21:46,932][130107] Initialized w:2 v:0 player:5 -[2023-09-12 18:21:46,934][130107] 8 agent workers initialized for env 2! -[2023-09-12 18:21:46,940][130142] Initializing env for player 0, init_info: {'port': 40900}... -[2023-09-12 18:21:46,982][130107] Decorrelating experience for 0 frames... -[2023-09-12 18:21:46,984][130142] Using port 40900 on host... -[2023-09-12 18:21:46,990][130142] Initializing env for player 1, init_info: {'port': 40900}... -[2023-09-12 18:21:47,009][130107] Port 40501 is available -[2023-09-12 18:21:47,009][130107] Using port 40501 -[2023-09-12 18:21:47,010][130107] Initializing env for player 0, init_info: {'port': 40501}... -[2023-09-12 18:21:47,040][130142] Initializing env for player 2, init_info: {'port': 40900}... -[2023-09-12 18:21:47,041][130107] Using port 40501 on host... -[2023-09-12 18:21:47,060][130107] Initializing env for player 1, init_info: {'port': 40501}... -[2023-09-12 18:21:47,092][130108] Initialized w:5 v:0 player:2 -[2023-09-12 18:21:47,094][130108] Initialized w:5 v:0 player:7 -[2023-09-12 18:21:47,095][130108] Initialized w:5 v:0 player:5 -[2023-09-12 18:21:47,095][130108] Initialized w:5 v:0 player:0 -[2023-09-12 18:21:47,095][130142] Initializing env for player 3, init_info: {'port': 40900}... -[2023-09-12 18:21:47,095][130108] Initialized w:5 v:0 player:4 -[2023-09-12 18:21:47,096][130108] Initialized w:5 v:0 player:6 -[2023-09-12 18:21:47,096][130108] Initialized w:5 v:0 player:3 -[2023-09-12 18:21:47,096][130108] Initialized w:5 v:0 player:1 -[2023-09-12 18:21:47,098][130108] 8 agent workers initialized for env 5! -[2023-09-12 18:21:47,110][130107] Initializing env for player 2, init_info: {'port': 40501}... -[2023-09-12 18:21:47,113][130143] Initialized w:7 v:0 player:1 -[2023-09-12 18:21:47,114][130143] Initialized w:7 v:0 player:0 -[2023-09-12 18:21:47,114][130143] Initialized w:7 v:0 player:5 -[2023-09-12 18:21:47,115][130143] Initialized w:7 v:0 player:3 -[2023-09-12 18:21:47,115][130143] Initialized w:7 v:0 player:2 -[2023-09-12 18:21:47,116][130143] Initialized w:7 v:0 player:6 -[2023-09-12 18:21:47,117][130143] Initialized w:7 v:0 player:7 -[2023-09-12 18:21:47,118][130143] Initialized w:7 v:0 player:4 -[2023-09-12 18:21:47,119][130143] 8 agent workers initialized for env 7! -[2023-09-12 18:21:47,126][130108] Decorrelating experience for 0 frames... -[2023-09-12 18:21:47,128][130108] Port 40801 is available -[2023-09-12 18:21:47,128][130108] Using port 40801 -[2023-09-12 18:21:47,129][130108] Initializing env for player 0, init_info: {'port': 40801}... -[2023-09-12 18:21:47,138][130106] Initialized w:1 v:0 player:4 -[2023-09-12 18:21:47,141][130106] Initialized w:1 v:0 player:7 -[2023-09-12 18:21:47,142][130106] Initialized w:1 v:0 player:5 -[2023-09-12 18:21:47,142][130106] Initialized w:1 v:0 player:3 -[2023-09-12 18:21:47,143][130142] Initializing env for player 4, init_info: {'port': 40900}... -[2023-09-12 18:21:47,143][130106] Initialized w:1 v:0 player:2 -[2023-09-12 18:21:47,144][130106] Initialized w:1 v:0 player:1 -[2023-09-12 18:21:47,145][130106] Initialized w:1 v:0 player:0 -[2023-09-12 18:21:47,145][130106] Initialized w:1 v:0 player:6 -[2023-09-12 18:21:47,146][130106] 8 agent workers initialized for env 1! -[2023-09-12 18:21:47,161][130107] Initializing env for player 3, init_info: {'port': 40501}... -[2023-09-12 18:21:47,173][130108] Using port 40801 on host... -[2023-09-12 18:21:47,173][130109] Initialized w:4 v:0 player:3 -[2023-09-12 18:21:47,176][130109] Initialized w:4 v:0 player:4 -[2023-09-12 18:21:47,176][130109] Initialized w:4 v:0 player:7 -[2023-09-12 18:21:47,179][130109] Initialized w:4 v:0 player:5 -[2023-09-12 18:21:47,180][130109] Initialized w:4 v:0 player:2 -[2023-09-12 18:21:47,180][130109] Initialized w:4 v:0 player:6 -[2023-09-12 18:21:47,182][130108] Initializing env for player 1, init_info: {'port': 40801}... -[2023-09-12 18:21:47,183][130109] Initialized w:4 v:0 player:0 -[2023-09-12 18:21:47,184][130109] Initialized w:4 v:0 player:1 -[2023-09-12 18:21:47,185][130109] 8 agent workers initialized for env 4! -[2023-09-12 18:21:47,185][130143] Decorrelating experience for 0 frames... -[2023-09-12 18:21:47,187][130143] Port 41001 is available -[2023-09-12 18:21:47,187][130143] Using port 41001 -[2023-09-12 18:21:47,188][130143] Initializing env for player 0, init_info: {'port': 41001}... -[2023-09-12 18:21:47,205][130072] Initialized w:0 v:0 player:2 -[2023-09-12 18:21:47,206][130072] Initialized w:0 v:0 player:4 -[2023-09-12 18:21:47,207][130142] Initializing env for player 5, init_info: {'port': 40900}... -[2023-09-12 18:21:47,206][130072] Initialized w:0 v:0 player:1 -[2023-09-12 18:21:47,206][130072] Initialized w:0 v:0 player:6 -[2023-09-12 18:21:47,206][130072] Initialized w:0 v:0 player:5 -[2023-09-12 18:21:47,207][130072] Initialized w:0 v:0 player:3 -[2023-09-12 18:21:47,207][130072] Initialized w:0 v:0 player:0 -[2023-09-12 18:21:47,207][130072] Initialized w:0 v:0 player:7 -[2023-09-12 18:21:47,210][130072] 8 agent workers initialized for env 0! -[2023-09-12 18:21:47,215][130107] Initializing env for player 4, init_info: {'port': 40501}... -[2023-09-12 18:21:47,232][130108] Initializing env for player 2, init_info: {'port': 40801}... -[2023-09-12 18:21:47,233][130141] Initialized w:3 v:0 player:1 -[2023-09-12 18:21:47,234][130143] Using port 41001 on host... -[2023-09-12 18:21:47,238][130141] Initialized w:3 v:0 player:0 -[2023-09-12 18:21:47,239][130141] Initialized w:3 v:0 player:6 -[2023-09-12 18:21:47,239][130141] Initialized w:3 v:0 player:7 -[2023-09-12 18:21:47,239][130141] Initialized w:3 v:0 player:3 -[2023-09-12 18:21:47,239][130141] Initialized w:3 v:0 player:2 -[2023-09-12 18:21:47,241][130106] Decorrelating experience for 0 frames... -[2023-09-12 18:21:47,239][130141] Initialized w:3 v:0 player:5 -[2023-09-12 18:21:47,239][130141] Initialized w:3 v:0 player:4 -[2023-09-12 18:21:47,242][130141] 8 agent workers initialized for env 3! -[2023-09-12 18:21:47,243][130106] Port 40401 is available -[2023-09-12 18:21:47,243][130106] Using port 40401 -[2023-09-12 18:21:47,243][130143] Initializing env for player 1, init_info: {'port': 41001}... -[2023-09-12 18:21:47,247][130142] Initializing env for player 6, init_info: {'port': 40900}... -[2023-09-12 18:21:47,258][130072] Decorrelating experience for 0 frames... -[2023-09-12 18:21:47,260][130072] Port 40301 is available -[2023-09-12 18:21:47,260][130072] Using port 40301 -[2023-09-12 18:21:47,261][130072] Initializing env for player 0, init_info: {'port': 40301}... -[2023-09-12 18:21:47,268][130109] Decorrelating experience for 0 frames... -[2023-09-12 18:21:47,269][130107] Initializing env for player 5, init_info: {'port': 40501}... -[2023-09-12 18:21:47,270][130109] Port 40701 is available -[2023-09-12 18:21:47,271][130109] Using port 40701 -[2023-09-12 18:21:47,271][130109] Initializing env for player 0, init_info: {'port': 40701}... -[2023-09-12 18:21:47,287][130108] Initializing env for player 3, init_info: {'port': 40801}... -[2023-09-12 18:21:47,299][130143] Initializing env for player 2, init_info: {'port': 41001}... -[2023-09-12 18:21:47,302][130109] Using port 40701 on host... -[2023-09-12 18:21:47,302][130141] Decorrelating experience for 0 frames... -[2023-09-12 18:21:47,303][130142] Initializing env for player 7, init_info: {'port': 40900}... -[2023-09-12 18:21:47,304][130141] Port 40601 is available -[2023-09-12 18:21:47,304][130141] Using port 40601 -[2023-09-12 18:21:47,305][130072] Using port 40301 on host... -[2023-09-12 18:21:47,314][130072] Initializing env for player 1, init_info: {'port': 40301}... -[2023-09-12 18:21:47,322][130109] Initializing env for player 1, init_info: {'port': 40701}... -[2023-09-12 18:21:47,343][130107] Initializing env for player 6, init_info: {'port': 40501}... -[2023-09-12 18:21:47,351][130143] Initializing env for player 3, init_info: {'port': 41001}... -[2023-09-12 18:21:47,349][130108] Initializing env for player 4, init_info: {'port': 40801}... -[2023-09-12 18:21:47,372][130072] Initializing env for player 2, init_info: {'port': 40301}... -[2023-09-12 18:21:47,379][130107] Initializing env for player 7, init_info: {'port': 40501}... -[2023-09-12 18:21:47,419][130108] Initializing env for player 5, init_info: {'port': 40801}... -[2023-09-12 18:21:47,376][130109] Initializing env for player 2, init_info: {'port': 40701}... -[2023-09-12 18:21:47,419][130143] Initializing env for player 4, init_info: {'port': 41001}... -[2023-09-12 18:21:47,427][130109] Initializing env for player 3, init_info: {'port': 40701}... -[2023-09-12 18:21:47,426][130072] Initializing env for player 3, init_info: {'port': 40301}... -[2023-09-12 18:21:47,475][130143] Initializing env for player 5, init_info: {'port': 41001}... -[2023-09-12 18:21:47,483][130108] Initializing env for player 6, init_info: {'port': 40801}... -[2023-09-12 18:21:47,485][130072] Initializing env for player 4, init_info: {'port': 40301}... -[2023-09-12 18:21:47,480][130109] Initializing env for player 4, init_info: {'port': 40701}... -[2023-09-12 18:21:47,526][130143] Initializing env for player 6, init_info: {'port': 41001}... -[2023-09-12 18:21:47,528][130109] Initializing env for player 5, init_info: {'port': 40701}... -[2023-09-12 18:21:47,532][130108] Initializing env for player 7, init_info: {'port': 40801}... -[2023-09-12 18:21:47,539][130072] Initializing env for player 5, init_info: {'port': 40301}... -[2023-09-12 18:21:47,579][130109] Initializing env for player 6, init_info: {'port': 40701}... -[2023-09-12 18:21:47,581][130143] Initializing env for player 7, init_info: {'port': 41001}... -[2023-09-12 18:21:47,590][130072] Initializing env for player 6, init_info: {'port': 40301}... -[2023-09-12 18:21:47,629][130109] Initializing env for player 7, init_info: {'port': 40701}... -[2023-09-12 18:21:47,640][130072] Initializing env for player 7, init_info: {'port': 40301}... -[2023-09-12 18:21:48,935][130107] Initialized w:2 v:1 player:6 -[2023-09-12 18:21:48,938][130107] Initialized w:2 v:1 player:5 -[2023-09-12 18:21:48,938][130107] Initialized w:2 v:1 player:3 -[2023-09-12 18:21:48,939][130107] Initialized w:2 v:1 player:0 -[2023-09-12 18:21:48,938][130107] Initialized w:2 v:1 player:1 -[2023-09-12 18:21:48,940][130107] Initialized w:2 v:1 player:7 -[2023-09-12 18:21:48,940][130107] Initialized w:2 v:1 player:4 -[2023-09-12 18:21:48,941][130107] Initialized w:2 v:1 player:2 -[2023-09-12 18:21:48,942][130107] 8 agent workers initialized for env 2! -[2023-09-12 18:21:48,961][130108] Initialized w:5 v:1 player:4 -[2023-09-12 18:21:48,961][130142] Initialized w:6 v:0 player:0 -[2023-09-12 18:21:48,961][130142] Initialized w:6 v:0 player:4 -[2023-09-12 18:21:48,962][130108] Initialized w:5 v:1 player:0 -[2023-09-12 18:21:48,962][130142] Initialized w:6 v:0 player:7 -[2023-09-12 18:21:48,962][130108] Initialized w:5 v:1 player:1 -[2023-09-12 18:21:48,963][130142] Initialized w:6 v:0 player:3 -[2023-09-12 18:21:48,963][130108] Initialized w:5 v:1 player:7 -[2023-09-12 18:21:48,963][130142] Initialized w:6 v:0 player:2 -[2023-09-12 18:21:48,963][130108] Initialized w:5 v:1 player:5 -[2023-09-12 18:21:48,963][130142] Initialized w:6 v:0 player:5 -[2023-09-12 18:21:48,963][130108] Initialized w:5 v:1 player:6 -[2023-09-12 18:21:48,964][130142] Initialized w:6 v:0 player:6 -[2023-09-12 18:21:48,963][130108] Initialized w:5 v:1 player:3 -[2023-09-12 18:21:48,964][130108] Initialized w:5 v:1 player:2 -[2023-09-12 18:21:48,964][130142] Initialized w:6 v:0 player:1 -[2023-09-12 18:21:48,965][130108] 8 agent workers initialized for env 5! -[2023-09-12 18:21:48,965][130143] Initialized w:7 v:1 player:6 -[2023-09-12 18:21:48,966][130142] 8 agent workers initialized for env 6! -[2023-09-12 18:21:48,966][130143] Initialized w:7 v:1 player:4 -[2023-09-12 18:21:48,966][130143] Initialized w:7 v:1 player:7 -[2023-09-12 18:21:48,968][130143] Initialized w:7 v:1 player:5 -[2023-09-12 18:21:48,966][130143] Initialized w:7 v:1 player:2 -[2023-09-12 18:21:48,966][130143] Initialized w:7 v:1 player:1 -[2023-09-12 18:21:48,968][130143] Initialized w:7 v:1 player:0 -[2023-09-12 18:21:48,968][130143] Initialized w:7 v:1 player:3 -[2023-09-12 18:21:48,970][130143] 8 agent workers initialized for env 7! -[2023-09-12 18:21:48,972][130106] Initializing env for player 0, init_info: {'port': 40401}... -[2023-09-12 18:21:49,000][130108] Decorrelating experience for 32 frames... -[2023-09-12 18:21:49,003][130143] Decorrelating experience for 32 frames... -[2023-09-12 18:21:49,007][130107] Decorrelating experience for 32 frames... -[2023-09-12 18:21:49,007][130142] Decorrelating experience for 0 frames... -[2023-09-12 18:21:49,009][130142] Port 40901 is available -[2023-09-12 18:21:49,009][130142] Using port 40901 -[2023-09-12 18:21:49,012][130106] Using port 40401 on host... -[2023-09-12 18:21:49,023][130106] Initializing env for player 1, init_info: {'port': 40401}... -[2023-09-12 18:21:49,073][130106] Initializing env for player 2, init_info: {'port': 40401}... -[2023-09-12 18:21:49,117][130072] Initialized w:0 v:1 player:2 -[2023-09-12 18:21:49,118][130072] Initialized w:0 v:1 player:5 -[2023-09-12 18:21:49,119][130072] Initialized w:0 v:1 player:4 -[2023-09-12 18:21:49,120][130072] Initialized w:0 v:1 player:6 -[2023-09-12 18:21:49,120][130072] Initialized w:0 v:1 player:3 -[2023-09-12 18:21:49,121][130072] Initialized w:0 v:1 player:1 -[2023-09-12 18:21:49,121][130072] Initialized w:0 v:1 player:0 -[2023-09-12 18:21:49,123][130072] Initialized w:0 v:1 player:7 -[2023-09-12 18:21:49,123][130072] 8 agent workers initialized for env 0! -[2023-09-12 18:21:49,133][130106] Initializing env for player 3, init_info: {'port': 40401}... -[2023-09-12 18:21:49,174][130072] Decorrelating experience for 32 frames... -[2023-09-12 18:21:49,183][130106] Initializing env for player 4, init_info: {'port': 40401}... -[2023-09-12 18:21:49,225][130109] Initialized w:4 v:1 player:3 -[2023-09-12 18:21:49,228][130109] Initialized w:4 v:1 player:4 -[2023-09-12 18:21:49,228][130109] Initialized w:4 v:1 player:1 -[2023-09-12 18:21:49,229][130109] Initialized w:4 v:1 player:7 -[2023-09-12 18:21:49,229][130109] Initialized w:4 v:1 player:0 -[2023-09-12 18:21:49,229][130109] Initialized w:4 v:1 player:5 -[2023-09-12 18:21:49,229][130109] Initialized w:4 v:1 player:6 -[2023-09-12 18:21:49,230][130109] Initialized w:4 v:1 player:2 -[2023-09-12 18:21:49,233][130109] 8 agent workers initialized for env 4! -[2023-09-12 18:21:49,235][130106] Initializing env for player 5, init_info: {'port': 40401}... -[2023-09-12 18:21:49,280][130141] Initializing env for player 0, init_info: {'port': 40601}... -[2023-09-12 18:21:49,287][130106] Initializing env for player 6, init_info: {'port': 40401}... -[2023-09-12 18:21:49,306][130109] Decorrelating experience for 32 frames... -[2023-09-12 18:21:49,319][130141] Using port 40601 on host... -[2023-09-12 18:21:49,330][130141] Initializing env for player 1, init_info: {'port': 40601}... -[2023-09-12 18:21:49,347][130106] Initializing env for player 7, init_info: {'port': 40401}... -[2023-09-12 18:21:49,381][130141] Initializing env for player 2, init_info: {'port': 40601}... -[2023-09-12 18:21:49,435][130141] Initializing env for player 3, init_info: {'port': 40601}... -[2023-09-12 18:21:49,448][130143] Multi agent env, num agents: 8 -[2023-09-12 18:21:49,487][130141] Initializing env for player 4, init_info: {'port': 40601}... -[2023-09-12 18:21:49,495][130143] Multi agent env, num agents: 8 -[2023-09-12 18:21:49,545][130143] Port 41002 is available -[2023-09-12 18:21:49,546][130143] Using port 41002 -[2023-09-12 18:21:49,546][130143] Initializing env for player 0, init_info: {'port': 41002}... -[2023-09-12 18:21:49,539][130141] Initializing env for player 5, init_info: {'port': 40601}... -[2023-09-12 18:21:49,564][130108] Multi agent env, num agents: 8 -[2023-09-12 18:21:49,591][130141] Initializing env for player 6, init_info: {'port': 40601}... -[2023-09-12 18:21:49,591][130143] Using port 41002 on host... -[2023-09-12 18:21:49,596][130072] Multi agent env, num agents: 8 -[2023-09-12 18:21:49,597][130143] Initializing env for player 1, init_info: {'port': 41002}... -[2023-09-12 18:21:49,610][130108] Multi agent env, num agents: 8 -[2023-09-12 18:21:49,636][130072] Multi agent env, num agents: 8 -[2023-09-12 18:21:49,643][130141] Initializing env for player 7, init_info: {'port': 40601}... -[2023-09-12 18:21:49,651][130143] Initializing env for player 2, init_info: {'port': 41002}... -[2023-09-12 18:21:49,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:21:49,676][130072] Port 40302 is available -[2023-09-12 18:21:49,676][130072] Using port 40302 -[2023-09-12 18:21:49,677][130072] Initializing env for player 0, init_info: {'port': 40302}... -[2023-09-12 18:21:49,685][130107] Multi agent env, num agents: 8 -[2023-09-12 18:21:49,699][130143] Initializing env for player 3, init_info: {'port': 41002}... -[2023-09-12 18:21:49,707][130108] Port 40802 is available -[2023-09-12 18:21:49,707][130108] Using port 40802 -[2023-09-12 18:21:49,708][130108] Initializing env for player 0, init_info: {'port': 40802}... -[2023-09-12 18:21:49,711][130109] Multi agent env, num agents: 8 -[2023-09-12 18:21:49,712][130072] Using port 40302 on host... -[2023-09-12 18:21:49,717][130107] Multi agent env, num agents: 8 -[2023-09-12 18:21:49,728][130072] Initializing env for player 1, init_info: {'port': 40302}... -[2023-09-12 18:21:49,742][130109] Multi agent env, num agents: 8 -[2023-09-12 18:21:49,747][130107] Port 40502 is available -[2023-09-12 18:21:49,748][130107] Using port 40502 -[2023-09-12 18:21:49,748][130143] Initializing env for player 4, init_info: {'port': 41002}... -[2023-09-12 18:21:49,748][130107] Initializing env for player 0, init_info: {'port': 40502}... -[2023-09-12 18:21:49,754][130108] Using port 40802 on host... -[2023-09-12 18:21:49,765][130108] Initializing env for player 1, init_info: {'port': 40802}... -[2023-09-12 18:21:49,773][130109] Port 40702 is available -[2023-09-12 18:21:49,774][130109] Using port 40702 -[2023-09-12 18:21:49,774][130109] Initializing env for player 0, init_info: {'port': 40702}... -[2023-09-12 18:21:49,777][130107] Using port 40502 on host... -[2023-09-12 18:21:49,781][130072] Initializing env for player 2, init_info: {'port': 40302}... -[2023-09-12 18:21:49,799][130143] Initializing env for player 5, init_info: {'port': 41002}... -[2023-09-12 18:21:49,799][130107] Initializing env for player 1, init_info: {'port': 40502}... -[2023-09-12 18:21:49,815][130108] Initializing env for player 2, init_info: {'port': 40802}... -[2023-09-12 18:21:49,818][130109] Using port 40702 on host... -[2023-09-12 18:21:49,831][130109] Initializing env for player 1, init_info: {'port': 40702}... -[2023-09-12 18:21:49,843][130072] Initializing env for player 3, init_info: {'port': 40302}... -[2023-09-12 18:21:49,851][130107] Initializing env for player 2, init_info: {'port': 40502}... -[2023-09-12 18:21:49,859][130143] Initializing env for player 6, init_info: {'port': 41002}... -[2023-09-12 18:21:49,886][130109] Initializing env for player 2, init_info: {'port': 40702}... -[2023-09-12 18:21:49,887][130108] Initializing env for player 3, init_info: {'port': 40802}... -[2023-09-12 18:21:49,889][130072] Initializing env for player 4, init_info: {'port': 40302}... -[2023-09-12 18:21:49,900][130107] Initializing env for player 3, init_info: {'port': 40502}... -[2023-09-12 18:21:49,911][130143] Initializing env for player 7, init_info: {'port': 41002}... -[2023-09-12 18:21:49,936][130108] Initializing env for player 4, init_info: {'port': 40802}... -[2023-09-12 18:21:49,947][130109] Initializing env for player 3, init_info: {'port': 40702}... -[2023-09-12 18:21:49,951][130072] Initializing env for player 5, init_info: {'port': 40302}... -[2023-09-12 18:21:49,972][130107] Initializing env for player 4, init_info: {'port': 40502}... -[2023-09-12 18:21:49,987][130108] Initializing env for player 5, init_info: {'port': 40802}... -[2023-09-12 18:21:49,999][130072] Initializing env for player 6, init_info: {'port': 40302}... -[2023-09-12 18:21:50,003][130109] Initializing env for player 4, init_info: {'port': 40702}... -[2023-09-12 18:21:50,015][130107] Initializing env for player 5, init_info: {'port': 40502}... -[2023-09-12 18:21:50,043][130108] Initializing env for player 6, init_info: {'port': 40802}... -[2023-09-12 18:21:50,048][130109] Initializing env for player 5, init_info: {'port': 40702}... -[2023-09-12 18:21:50,055][130072] Initializing env for player 7, init_info: {'port': 40302}... -[2023-09-12 18:21:50,068][130107] Initializing env for player 6, init_info: {'port': 40502}... -[2023-09-12 18:21:50,099][130109] Initializing env for player 6, init_info: {'port': 40702}... -[2023-09-12 18:21:50,103][130108] Initializing env for player 7, init_info: {'port': 40802}... -[2023-09-12 18:21:50,118][130107] Initializing env for player 7, init_info: {'port': 40502}... -[2023-09-12 18:21:50,184][130109] Initializing env for player 7, init_info: {'port': 40702}... -[2023-09-12 18:21:50,737][130106] Initialized w:1 v:1 player:4 -[2023-09-12 18:21:50,738][130106] Initialized w:1 v:1 player:5 -[2023-09-12 18:21:50,739][130106] Initialized w:1 v:1 player:6 -[2023-09-12 18:21:50,739][130106] Initialized w:1 v:1 player:2 -[2023-09-12 18:21:50,740][130106] Initialized w:1 v:1 player:7 -[2023-09-12 18:21:50,740][130106] Initialized w:1 v:1 player:0 -[2023-09-12 18:21:50,740][130106] Initialized w:1 v:1 player:3 -[2023-09-12 18:21:50,740][130106] Initialized w:1 v:1 player:1 -[2023-09-12 18:21:50,742][130106] 8 agent workers initialized for env 1! -[2023-09-12 18:21:50,774][130142] Initializing env for player 0, init_info: {'port': 40901}... -[2023-09-12 18:21:50,788][130106] Decorrelating experience for 32 frames... -[2023-09-12 18:21:50,804][130142] Using port 40901 on host... -[2023-09-12 18:21:50,825][130142] Initializing env for player 1, init_info: {'port': 40901}... -[2023-09-12 18:21:50,880][130142] Initializing env for player 2, init_info: {'port': 40901}... -[2023-09-12 18:21:50,935][130142] Initializing env for player 3, init_info: {'port': 40901}... -[2023-09-12 18:21:50,991][130142] Initializing env for player 4, init_info: {'port': 40901}... -[2023-09-12 18:21:51,059][130142] Initializing env for player 5, init_info: {'port': 40901}... -[2023-09-12 18:21:51,071][130106] Multi agent env, num agents: 8 -[2023-09-12 18:21:51,101][130106] Multi agent env, num agents: 8 -[2023-09-12 18:21:51,110][130142] Initializing env for player 6, init_info: {'port': 40901}... -[2023-09-12 18:21:51,138][130141] Initialized w:3 v:1 player:7 -[2023-09-12 18:21:51,139][130141] Initialized w:3 v:1 player:5 -[2023-09-12 18:21:51,139][130141] Initialized w:3 v:1 player:3 -[2023-09-12 18:21:51,139][130141] Initialized w:3 v:1 player:0 -[2023-09-12 18:21:51,139][130141] Initialized w:3 v:1 player:4 -[2023-09-12 18:21:51,140][130141] Initialized w:3 v:1 player:6 -[2023-09-12 18:21:51,140][130141] Initialized w:3 v:1 player:1 -[2023-09-12 18:21:51,140][130141] Initialized w:3 v:1 player:2 -[2023-09-12 18:21:51,142][130141] 8 agent workers initialized for env 3! -[2023-09-12 18:21:51,160][130142] Initializing env for player 7, init_info: {'port': 40901}... -[2023-09-12 18:21:51,164][130106] Port 40402 is available -[2023-09-12 18:21:51,164][130106] Using port 40402 -[2023-09-12 18:21:51,174][130141] Decorrelating experience for 32 frames... -[2023-09-12 18:21:51,376][130143] Initialized w:7 v:2 player:2 -[2023-09-12 18:21:51,377][130143] Initialized w:7 v:2 player:6 -[2023-09-12 18:21:51,377][130143] Initialized w:7 v:2 player:5 -[2023-09-12 18:21:51,378][130143] Initialized w:7 v:2 player:3 -[2023-09-12 18:21:51,378][130143] Initialized w:7 v:2 player:4 -[2023-09-12 18:21:51,378][130143] Initialized w:7 v:2 player:0 -[2023-09-12 18:21:51,378][130143] Initialized w:7 v:2 player:7 -[2023-09-12 18:21:51,381][130143] Initialized w:7 v:2 player:1 -[2023-09-12 18:21:51,383][130143] 8 agent workers initialized for env 7! -[2023-09-12 18:21:51,399][130107] Initialized w:2 v:2 player:4 -[2023-09-12 18:21:51,401][130107] Initialized w:2 v:2 player:6 -[2023-09-12 18:21:51,401][130107] Initialized w:2 v:2 player:1 -[2023-09-12 18:21:51,401][130107] Initialized w:2 v:2 player:5 -[2023-09-12 18:21:51,401][130107] Initialized w:2 v:2 player:0 -[2023-09-12 18:21:51,401][130107] Initialized w:2 v:2 player:2 -[2023-09-12 18:21:51,401][130107] Initialized w:2 v:2 player:7 -[2023-09-12 18:21:51,402][130107] Initialized w:2 v:2 player:3 -[2023-09-12 18:21:51,405][130107] 8 agent workers initialized for env 2! -[2023-09-12 18:21:51,423][130143] Decorrelating experience for 64 frames... -[2023-09-12 18:21:51,443][130108] Initialized w:5 v:2 player:6 -[2023-09-12 18:21:51,445][130108] Initialized w:5 v:2 player:1 -[2023-09-12 18:21:51,446][130108] Initialized w:5 v:2 player:4 -[2023-09-12 18:21:51,446][130108] Initialized w:5 v:2 player:5 -[2023-09-12 18:21:51,447][130108] Initialized w:5 v:2 player:2 -[2023-09-12 18:21:51,448][130108] Initialized w:5 v:2 player:7 -[2023-09-12 18:21:51,448][130108] Initialized w:5 v:2 player:0 -[2023-09-12 18:21:51,448][130108] Initialized w:5 v:2 player:3 -[2023-09-12 18:21:51,450][130108] 8 agent workers initialized for env 5! -[2023-09-12 18:21:51,453][130107] Decorrelating experience for 64 frames... -[2023-09-12 18:21:51,517][130109] Initialized w:4 v:2 player:3 -[2023-09-12 18:21:51,519][130109] Initialized w:4 v:2 player:1 -[2023-09-12 18:21:51,519][130109] Initialized w:4 v:2 player:0 -[2023-09-12 18:21:51,519][130109] Initialized w:4 v:2 player:5 -[2023-09-12 18:21:51,520][130109] Initialized w:4 v:2 player:7 -[2023-09-12 18:21:51,520][130109] Initialized w:4 v:2 player:6 -[2023-09-12 18:21:51,520][130109] Initialized w:4 v:2 player:4 -[2023-09-12 18:21:51,521][130109] Initialized w:4 v:2 player:2 -[2023-09-12 18:21:51,522][130108] Decorrelating experience for 64 frames... -[2023-09-12 18:21:51,523][130109] 8 agent workers initialized for env 4! -[2023-09-12 18:21:51,528][130072] Initialized w:0 v:2 player:2 -[2023-09-12 18:21:51,530][130072] Initialized w:0 v:2 player:0 -[2023-09-12 18:21:51,531][130072] Initialized w:0 v:2 player:1 -[2023-09-12 18:21:51,531][130072] Initialized w:0 v:2 player:3 -[2023-09-12 18:21:51,531][130072] Initialized w:0 v:2 player:5 -[2023-09-12 18:21:51,531][130072] Initialized w:0 v:2 player:7 -[2023-09-12 18:21:51,531][130072] Initialized w:0 v:2 player:6 -[2023-09-12 18:21:51,532][130072] Initialized w:0 v:2 player:4 -[2023-09-12 18:21:51,536][130072] 8 agent workers initialized for env 0! -[2023-09-12 18:21:51,560][130109] Decorrelating experience for 64 frames... -[2023-09-12 18:21:51,603][130141] Multi agent env, num agents: 8 -[2023-09-12 18:21:51,612][130072] Decorrelating experience for 64 frames... -[2023-09-12 18:21:51,642][130141] Multi agent env, num agents: 8 -[2023-09-12 18:21:51,681][130141] Port 40602 is available -[2023-09-12 18:21:51,681][130141] Using port 40602 -[2023-09-12 18:21:51,681][130141] Initializing env for player 0, init_info: {'port': 40602}... -[2023-09-12 18:21:51,716][130141] Using port 40602 on host... -[2023-09-12 18:21:51,732][130141] Initializing env for player 1, init_info: {'port': 40602}... -[2023-09-12 18:21:51,782][130141] Initializing env for player 2, init_info: {'port': 40602}... -[2023-09-12 18:21:51,847][130141] Initializing env for player 3, init_info: {'port': 40602}... -[2023-09-12 18:21:51,903][130141] Initializing env for player 4, init_info: {'port': 40602}... -[2023-09-12 18:21:51,955][130141] Initializing env for player 5, init_info: {'port': 40602}... -[2023-09-12 18:21:52,011][130141] Initializing env for player 6, init_info: {'port': 40602}... -[2023-09-12 18:21:52,063][130141] Initializing env for player 7, init_info: {'port': 40602}... -[2023-09-12 18:21:52,160][130143] Port 41003 is available -[2023-09-12 18:21:52,160][130143] Using port 41003 -[2023-09-12 18:21:52,161][130143] Initializing env for player 0, init_info: {'port': 41003}... -[2023-09-12 18:21:52,169][130107] Port 40503 is available -[2023-09-12 18:21:52,169][130107] Using port 40503 -[2023-09-12 18:21:52,170][130107] Initializing env for player 0, init_info: {'port': 40503}... -[2023-09-12 18:21:52,199][130107] Using port 40503 on host... -[2023-09-12 18:21:52,205][130143] Using port 41003 on host... -[2023-09-12 18:21:52,220][130143] Initializing env for player 1, init_info: {'port': 41003}... -[2023-09-12 18:21:52,220][130107] Initializing env for player 1, init_info: {'port': 40503}... -[2023-09-12 18:21:52,272][130107] Initializing env for player 2, init_info: {'port': 40503}... -[2023-09-12 18:21:52,287][130143] Initializing env for player 2, init_info: {'port': 41003}... -[2023-09-12 18:21:52,324][130107] Initializing env for player 3, init_info: {'port': 40503}... -[2023-09-12 18:21:52,338][130143] Initializing env for player 3, init_info: {'port': 41003}... -[2023-09-12 18:21:52,377][130107] Initializing env for player 4, init_info: {'port': 40503}... -[2023-09-12 18:21:52,385][130142] Initialized w:6 v:1 player:5 -[2023-09-12 18:21:52,385][130142] Initialized w:6 v:1 player:3 -[2023-09-12 18:21:52,387][130142] Initialized w:6 v:1 player:6 -[2023-09-12 18:21:52,388][130142] Initialized w:6 v:1 player:7 -[2023-09-12 18:21:52,388][130142] Initialized w:6 v:1 player:4 -[2023-09-12 18:21:52,388][130142] Initialized w:6 v:1 player:1 -[2023-09-12 18:21:52,389][130142] Initialized w:6 v:1 player:0 -[2023-09-12 18:21:52,390][130142] Initialized w:6 v:1 player:2 -[2023-09-12 18:21:52,391][130142] 8 agent workers initialized for env 6! -[2023-09-12 18:21:52,397][130143] Initializing env for player 4, init_info: {'port': 41003}... -[2023-09-12 18:21:52,426][130072] Port 40303 is available -[2023-09-12 18:21:52,426][130072] Using port 40303 -[2023-09-12 18:21:52,427][130072] Initializing env for player 0, init_info: {'port': 40303}... -[2023-09-12 18:21:52,428][130108] Port 40803 is available -[2023-09-12 18:21:52,428][130108] Using port 40803 -[2023-09-12 18:21:52,428][130108] Initializing env for player 0, init_info: {'port': 40803}... -[2023-09-12 18:21:52,431][130107] Initializing env for player 5, init_info: {'port': 40503}... -[2023-09-12 18:21:52,433][130142] Decorrelating experience for 32 frames... -[2023-09-12 18:21:52,433][130106] Initializing env for player 0, init_info: {'port': 40402}... -[2023-09-12 18:21:52,447][130143] Initializing env for player 5, init_info: {'port': 41003}... -[2023-09-12 18:21:52,463][130106] Using port 40402 on host... -[2023-09-12 18:21:52,465][130072] Using port 40303 on host... -[2023-09-12 18:21:52,470][130108] Using port 40803 on host... -[2023-09-12 18:21:52,478][130072] Initializing env for player 1, init_info: {'port': 40303}... -[2023-09-12 18:21:52,480][130108] Initializing env for player 1, init_info: {'port': 40803}... -[2023-09-12 18:21:52,483][130107] Initializing env for player 6, init_info: {'port': 40503}... -[2023-09-12 18:21:52,484][130106] Initializing env for player 1, init_info: {'port': 40402}... -[2023-09-12 18:21:52,499][130143] Initializing env for player 6, init_info: {'port': 41003}... -[2023-09-12 18:21:52,501][130109] Port 40703 is available -[2023-09-12 18:21:52,502][130109] Using port 40703 -[2023-09-12 18:21:52,502][130109] Initializing env for player 0, init_info: {'port': 40703}... -[2023-09-12 18:21:52,528][130072] Initializing env for player 2, init_info: {'port': 40303}... -[2023-09-12 18:21:52,531][130108] Initializing env for player 2, init_info: {'port': 40803}... -[2023-09-12 18:21:52,532][130109] Using port 40703 on host... -[2023-09-12 18:21:52,534][130106] Initializing env for player 2, init_info: {'port': 40402}... -[2023-09-12 18:21:52,535][130107] Initializing env for player 7, init_info: {'port': 40503}... -[2023-09-12 18:21:52,553][130109] Initializing env for player 1, init_info: {'port': 40703}... -[2023-09-12 18:21:52,579][130143] Initializing env for player 7, init_info: {'port': 41003}... -[2023-09-12 18:21:52,581][130108] Initializing env for player 3, init_info: {'port': 40803}... -[2023-09-12 18:21:52,585][130106] Initializing env for player 3, init_info: {'port': 40402}... -[2023-09-12 18:21:52,578][130072] Initializing env for player 3, init_info: {'port': 40303}... -[2023-09-12 18:21:52,603][130109] Initializing env for player 2, init_info: {'port': 40703}... -[2023-09-12 18:21:52,631][130072] Initializing env for player 4, init_info: {'port': 40303}... -[2023-09-12 18:21:52,635][130108] Initializing env for player 4, init_info: {'port': 40803}... -[2023-09-12 18:21:52,647][130106] Initializing env for player 4, init_info: {'port': 40402}... -[2023-09-12 18:21:52,667][130109] Initializing env for player 3, init_info: {'port': 40703}... -[2023-09-12 18:21:52,681][130072] Initializing env for player 5, init_info: {'port': 40303}... -[2023-09-12 18:21:52,696][130106] Initializing env for player 5, init_info: {'port': 40402}... -[2023-09-12 18:21:52,715][130108] Initializing env for player 5, init_info: {'port': 40803}... -[2023-09-12 18:21:52,719][130109] Initializing env for player 4, init_info: {'port': 40703}... -[2023-09-12 18:21:52,734][130072] Initializing env for player 6, init_info: {'port': 40303}... -[2023-09-12 18:21:52,760][130106] Initializing env for player 6, init_info: {'port': 40402}... -[2023-09-12 18:21:52,772][130108] Initializing env for player 6, init_info: {'port': 40803}... -[2023-09-12 18:21:52,785][130072] Initializing env for player 7, init_info: {'port': 40303}... -[2023-09-12 18:21:52,811][130109] Initializing env for player 5, init_info: {'port': 40703}... -[2023-09-12 18:21:52,821][130108] Initializing env for player 7, init_info: {'port': 40803}... -[2023-09-12 18:21:52,827][130106] Initializing env for player 7, init_info: {'port': 40402}... -[2023-09-12 18:21:52,862][130109] Initializing env for player 6, init_info: {'port': 40703}... -[2023-09-12 18:21:52,888][130142] Multi agent env, num agents: 8 -[2023-09-12 18:21:52,912][130109] Initializing env for player 7, init_info: {'port': 40703}... -[2023-09-12 18:21:52,936][130142] Multi agent env, num agents: 8 -[2023-09-12 18:21:52,981][130142] Port 40902 is available -[2023-09-12 18:21:52,981][130142] Using port 40902 -[2023-09-12 18:21:53,438][130141] Initialized w:3 v:2 player:6 -[2023-09-12 18:21:53,441][130141] Initialized w:3 v:2 player:0 -[2023-09-12 18:21:53,441][130141] Initialized w:3 v:2 player:1 -[2023-09-12 18:21:53,441][130141] Initialized w:3 v:2 player:7 -[2023-09-12 18:21:53,442][130141] Initialized w:3 v:2 player:3 -[2023-09-12 18:21:53,442][130141] Initialized w:3 v:2 player:2 -[2023-09-12 18:21:53,442][130141] Initialized w:3 v:2 player:4 -[2023-09-12 18:21:53,442][130141] Initialized w:3 v:2 player:5 -[2023-09-12 18:21:53,445][130141] 8 agent workers initialized for env 3! -[2023-09-12 18:21:53,488][130141] Decorrelating experience for 64 frames... -[2023-09-12 18:21:53,969][130107] Initialized w:2 v:3 player:1 -[2023-09-12 18:21:53,971][130107] Initialized w:2 v:3 player:2 -[2023-09-12 18:21:53,971][130107] Initialized w:2 v:3 player:3 -[2023-09-12 18:21:53,971][130107] Initialized w:2 v:3 player:6 -[2023-09-12 18:21:53,971][130107] Initialized w:2 v:3 player:4 -[2023-09-12 18:21:53,972][130107] Initialized w:2 v:3 player:0 -[2023-09-12 18:21:53,972][130107] Initialized w:2 v:3 player:7 -[2023-09-12 18:21:53,972][130107] Initialized w:2 v:3 player:5 -[2023-09-12 18:21:53,974][130107] 8 agent workers initialized for env 2! -[2023-09-12 18:21:53,989][130143] Initialized w:7 v:3 player:7 -[2023-09-12 18:21:53,990][130143] Initialized w:7 v:3 player:0 -[2023-09-12 18:21:53,991][130143] Initialized w:7 v:3 player:6 -[2023-09-12 18:21:53,991][130143] Initialized w:7 v:3 player:4 -[2023-09-12 18:21:53,992][130143] Initialized w:7 v:3 player:1 -[2023-09-12 18:21:53,992][130143] Initialized w:7 v:3 player:2 -[2023-09-12 18:21:53,992][130143] Initialized w:7 v:3 player:5 -[2023-09-12 18:21:53,994][130143] Initialized w:7 v:3 player:3 -[2023-09-12 18:21:53,995][130143] 8 agent workers initialized for env 7! -[2023-09-12 18:21:53,999][130107] Decorrelating experience for 96 frames... -[2023-09-12 18:21:54,068][130141] Port 40603 is available -[2023-09-12 18:21:54,068][130141] Using port 40603 -[2023-09-12 18:21:54,078][130143] Decorrelating experience for 96 frames... -[2023-09-12 18:21:54,343][130106] Initialized w:1 v:2 player:4 -[2023-09-12 18:21:54,347][130106] Initialized w:1 v:2 player:1 -[2023-09-12 18:21:54,348][130106] Initialized w:1 v:2 player:5 -[2023-09-12 18:21:54,348][130106] Initialized w:1 v:2 player:6 -[2023-09-12 18:21:54,348][130106] Initialized w:1 v:2 player:2 -[2023-09-12 18:21:54,349][130106] Initialized w:1 v:2 player:7 -[2023-09-12 18:21:54,349][130106] Initialized w:1 v:2 player:0 -[2023-09-12 18:21:54,358][130106] Initialized w:1 v:2 player:3 -[2023-09-12 18:21:54,359][130106] 8 agent workers initialized for env 1! -[2023-09-12 18:21:54,361][130072] Initialized w:0 v:3 player:6 -[2023-09-12 18:21:54,364][130072] Initialized w:0 v:3 player:0 -[2023-09-12 18:21:54,364][130072] Initialized w:0 v:3 player:4 -[2023-09-12 18:21:54,365][130072] Initialized w:0 v:3 player:5 -[2023-09-12 18:21:54,367][130072] Initialized w:0 v:3 player:1 -[2023-09-12 18:21:54,370][130072] Initialized w:0 v:3 player:7 -[2023-09-12 18:21:54,371][130072] Initialized w:0 v:3 player:2 -[2023-09-12 18:21:54,391][130108] Initialized w:5 v:3 player:6 -[2023-09-12 18:21:54,392][130108] Initialized w:5 v:3 player:7 -[2023-09-12 18:21:54,392][130108] Initialized w:5 v:3 player:3 -[2023-09-12 18:21:54,392][130108] Initialized w:5 v:3 player:1 -[2023-09-12 18:21:54,392][130108] Initialized w:5 v:3 player:4 -[2023-09-12 18:21:54,392][130108] Initialized w:5 v:3 player:0 -[2023-09-12 18:21:54,392][130108] Initialized w:5 v:3 player:2 -[2023-09-12 18:21:54,393][130108] Initialized w:5 v:3 player:5 -[2023-09-12 18:21:54,396][130142] Initializing env for player 0, init_info: {'port': 40902}... -[2023-09-12 18:21:54,396][130108] 8 agent workers initialized for env 5! -[2023-09-12 18:21:54,400][130106] Decorrelating experience for 64 frames... -[2023-09-12 18:21:54,409][130109] Initialized w:4 v:3 player:7 -[2023-09-12 18:21:54,410][130109] Initialized w:4 v:3 player:6 -[2023-09-12 18:21:54,411][130109] Initialized w:4 v:3 player:5 -[2023-09-12 18:21:54,412][130109] Initialized w:4 v:3 player:4 -[2023-09-12 18:21:54,412][130109] Initialized w:4 v:3 player:0 -[2023-09-12 18:21:54,413][130109] Initialized w:4 v:3 player:1 -[2023-09-12 18:21:54,414][130109] Initialized w:4 v:3 player:3 -[2023-09-12 18:21:54,414][130109] Initialized w:4 v:3 player:2 -[2023-09-12 18:21:54,415][130109] 8 agent workers initialized for env 4! -[2023-09-12 18:21:54,424][130141] Initializing env for player 0, init_info: {'port': 40603}... -[2023-09-12 18:21:54,430][130142] Using port 40902 on host... -[2023-09-12 18:21:54,433][130108] Decorrelating experience for 96 frames... -[2023-09-12 18:21:54,447][130142] Initializing env for player 1, init_info: {'port': 40902}... -[2023-09-12 18:21:54,448][130109] Decorrelating experience for 96 frames... -[2023-09-12 18:21:54,467][130141] Using port 40603 on host... -[2023-09-12 18:21:54,480][130141] Initializing env for player 1, init_info: {'port': 40603}... -[2023-09-12 18:21:54,497][130142] Initializing env for player 2, init_info: {'port': 40902}... -[2023-09-12 18:21:54,530][130141] Initializing env for player 2, init_info: {'port': 40603}... -[2023-09-12 18:21:54,548][130142] Initializing env for player 3, init_info: {'port': 40902}... -[2023-09-12 18:21:54,591][130141] Initializing env for player 3, init_info: {'port': 40603}... -[2023-09-12 18:21:54,598][130142] Initializing env for player 4, init_info: {'port': 40902}... -[2023-09-12 18:21:54,638][130141] Initializing env for player 4, init_info: {'port': 40603}... -[2023-09-12 18:21:54,649][130142] Initializing env for player 5, init_info: {'port': 40902}... -[2023-09-12 18:21:54,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:21:54,688][130141] Initializing env for player 5, init_info: {'port': 40603}... -[2023-09-12 18:21:54,711][130142] Initializing env for player 6, init_info: {'port': 40902}... -[2023-09-12 18:21:54,751][130141] Initializing env for player 6, init_info: {'port': 40603}... -[2023-09-12 18:21:54,776][130142] Initializing env for player 7, init_info: {'port': 40902}... -[2023-09-12 18:21:54,819][130141] Initializing env for player 7, init_info: {'port': 40603}... -[2023-09-12 18:21:55,469][130106] Port 40403 is available -[2023-09-12 18:21:55,470][130106] Using port 40403 -[2023-09-12 18:21:55,470][130106] Initializing env for player 0, init_info: {'port': 40403}... -[2023-09-12 18:21:55,506][130106] Using port 40403 on host... -[2023-09-12 18:21:55,521][130106] Initializing env for player 1, init_info: {'port': 40403}... -[2023-09-12 18:21:55,573][130106] Initializing env for player 2, init_info: {'port': 40403}... -[2023-09-12 18:21:55,627][130106] Initializing env for player 3, init_info: {'port': 40403}... -[2023-09-12 18:21:55,695][130106] Initializing env for player 4, init_info: {'port': 40403}... -[2023-09-12 18:21:55,735][130106] Initializing env for player 5, init_info: {'port': 40403}... -[2023-09-12 18:21:55,815][130106] Initializing env for player 6, init_info: {'port': 40403}... -[2023-09-12 18:21:55,866][130106] Initializing env for player 7, init_info: {'port': 40403}... -[2023-09-12 18:21:56,217][130142] Initialized w:6 v:2 player:0 -[2023-09-12 18:21:56,219][130142] Initialized w:6 v:2 player:2 -[2023-09-12 18:21:56,220][130142] Initialized w:6 v:2 player:6 -[2023-09-12 18:21:56,221][130142] Initialized w:6 v:2 player:3 -[2023-09-12 18:21:56,222][130142] Initialized w:6 v:2 player:4 -[2023-09-12 18:21:56,224][130142] Initialized w:6 v:2 player:7 -[2023-09-12 18:21:56,224][130142] Initialized w:6 v:2 player:1 -[2023-09-12 18:21:56,224][130142] Initialized w:6 v:2 player:5 -[2023-09-12 18:21:56,225][130142] 8 agent workers initialized for env 6! -[2023-09-12 18:21:56,231][130141] Initialized w:3 v:3 player:2 -[2023-09-12 18:21:56,231][130141] Initialized w:3 v:3 player:4 -[2023-09-12 18:21:56,232][130141] Initialized w:3 v:3 player:6 -[2023-09-12 18:21:56,232][130141] Initialized w:3 v:3 player:7 -[2023-09-12 18:21:56,232][130141] Initialized w:3 v:3 player:5 -[2023-09-12 18:21:56,232][130141] Initialized w:3 v:3 player:0 -[2023-09-12 18:21:56,233][130141] Initialized w:3 v:3 player:1 -[2023-09-12 18:21:56,233][130141] Initialized w:3 v:3 player:3 -[2023-09-12 18:21:56,234][130141] 8 agent workers initialized for env 3! -[2023-09-12 18:21:56,263][130142] Decorrelating experience for 64 frames... -[2023-09-12 18:21:56,287][130141] Decorrelating experience for 96 frames... -[2023-09-12 18:21:57,023][130142] Port 40903 is available -[2023-09-12 18:21:57,023][130142] Using port 40903 -[2023-09-12 18:21:57,024][130142] Initializing env for player 0, init_info: {'port': 40903}... -[2023-09-12 18:21:57,056][130142] Using port 40903 on host... -[2023-09-12 18:21:57,074][130142] Initializing env for player 1, init_info: {'port': 40903}... -[2023-09-12 18:21:57,130][130142] Initializing env for player 2, init_info: {'port': 40903}... -[2023-09-12 18:21:57,163][130106] Initialized w:1 v:3 player:4 -[2023-09-12 18:21:57,163][130106] Initialized w:1 v:3 player:5 -[2023-09-12 18:21:57,164][130106] Initialized w:1 v:3 player:3 -[2023-09-12 18:21:57,166][130106] Initialized w:1 v:3 player:0 -[2023-09-12 18:21:57,166][130106] Initialized w:1 v:3 player:1 -[2023-09-12 18:21:57,166][130106] Initialized w:1 v:3 player:2 -[2023-09-12 18:21:57,167][130106] Initialized w:1 v:3 player:6 -[2023-09-12 18:21:57,168][130106] Initialized w:1 v:3 player:7 -[2023-09-12 18:21:57,169][130106] 8 agent workers initialized for env 1! -[2023-09-12 18:21:57,180][130142] Initializing env for player 3, init_info: {'port': 40903}... -[2023-09-12 18:21:57,209][130106] Decorrelating experience for 96 frames... -[2023-09-12 18:21:57,243][130142] Initializing env for player 4, init_info: {'port': 40903}... -[2023-09-12 18:21:57,291][130142] Initializing env for player 5, init_info: {'port': 40903}... -[2023-09-12 18:21:57,347][130142] Initializing env for player 6, init_info: {'port': 40903}... -[2023-09-12 18:21:57,395][130142] Initializing env for player 7, init_info: {'port': 40903}... -[2023-09-12 18:21:58,410][129907] Signal inference workers to stop experience collection... -[2023-09-12 18:21:58,430][130071] InferenceWorker_p0-w0: stopping experience collection -[2023-09-12 18:21:58,949][130142] Initialized w:6 v:3 player:4 -[2023-09-12 18:21:58,950][130142] Initialized w:6 v:3 player:6 -[2023-09-12 18:21:58,951][130142] Initialized w:6 v:3 player:0 -[2023-09-12 18:21:58,951][130142] Initialized w:6 v:3 player:3 -[2023-09-12 18:21:58,952][130142] Initialized w:6 v:3 player:1 -[2023-09-12 18:21:58,951][130142] Initialized w:6 v:3 player:5 -[2023-09-12 18:21:58,951][130142] Initialized w:6 v:3 player:2 -[2023-09-12 18:21:58,952][130142] Initialized w:6 v:3 player:7 -[2023-09-12 18:21:58,953][130142] 8 agent workers initialized for env 6! -[2023-09-12 18:21:59,000][130142] Decorrelating experience for 96 frames... -[2023-09-12 18:21:59,376][129907] EvtLoop [learner_proc0_evt_loop, process=learner_proc0] unhandled exception in slot='on_new_training_batch' connected to emitter=Emitter(object_id='Batcher_0', signal_name='training_batches_available'), args=(0,) -Traceback (most recent call last): - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py", line 355, in _process_signal - slot_callable(*args) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner_worker.py", line 150, in on_new_training_batch - stats = self.learner.train(self.batcher.training_batches[batch_idx]) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 1046, in train - train_stats = self._train(buff, self.cfg.batch_size, experience_size, num_invalids) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 731, in _train - ) = self._calculate_losses(mb, num_invalids) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 649, in _calculate_losses - exploration_loss = self.exploration_loss_func(action_distribution, valids, num_invalids) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 477, in _symmetric_kl_exploration_loss - kl_prior = action_distribution.symmetric_kl_with_uniform_prior() - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py", line 247, in symmetric_kl_with_uniform_prior - sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions] - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py", line 247, in - sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions] -AttributeError: 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior' -[2023-09-12 18:21:59,377][129907] Unhandled exception 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior' in evt loop learner_proc0_evt_loop -[2023-09-12 18:21:59,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 123.7. Samples: 1856. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:22:00,070][129210] Heartbeat connected on Batcher_0 -[2023-09-12 18:22:00,077][129210] Heartbeat connected on InferenceWorker_p0-w0 -[2023-09-12 18:22:00,085][129210] Heartbeat connected on RolloutWorker_w1 -[2023-09-12 18:22:00,088][129210] Heartbeat connected on RolloutWorker_w2 -[2023-09-12 18:22:00,091][129210] Heartbeat connected on RolloutWorker_w3 -[2023-09-12 18:22:00,094][129210] Heartbeat connected on RolloutWorker_w4 -[2023-09-12 18:22:00,097][129210] Heartbeat connected on RolloutWorker_w5 -[2023-09-12 18:22:00,100][129210] Heartbeat connected on RolloutWorker_w6 -[2023-09-12 18:22:00,103][129210] Heartbeat connected on RolloutWorker_w7 -[2023-09-12 18:22:04,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 225.6. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:22:09,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 180.5. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:22:14,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 150.4. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:22:19,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 128.9. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:22:24,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 112.8. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:22:29,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 100.3. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:22:34,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 100.3. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:22:39,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 100.3. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:22:44,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 59.0. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:22:49,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:22:54,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:22:59,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:23:04,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:23:09,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:23:14,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:23:19,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:23:24,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:23:29,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:23:34,655][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 4512. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:23:38,652][130072] VizDoom game.init() threw an exception SignalException('Signal SIGINT received. ViZDoom instance has been closed.'). Terminate process... -[2023-09-12 18:23:38,653][129210] Keyboard interrupt detected in the event loop EvtLoop [Runner_EvtLoop, process=main process 129210], exiting... -[2023-09-12 18:23:38,655][130072] Failed with error RuntimeError('Critical error: worker stuck on initialization. Abort! '), trying again -[2023-09-12 18:23:38,656][129907] Stopping Batcher_0... -[2023-09-12 18:23:38,657][129907] Loop batcher_evt_loop terminating... -[2023-09-12 18:23:38,656][129210] Runner profile tree view: -main_loop: 118.5532 -[2023-09-12 18:23:38,658][129210] Collected {0: 0}, FPS: 0.0 -[2023-09-12 18:23:38,672][130071] Weights refcount: 2 0 -[2023-09-12 18:23:38,673][130071] Stopping InferenceWorker_p0-w0... -[2023-09-12 18:23:38,673][130071] Loop inference_proc0-0_evt_loop terminating... -[2023-09-12 18:23:38,819][129210] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json -[2023-09-12 18:23:38,820][129210] Overriding arg 'num_workers' with value 1 passed from command line -[2023-09-12 18:23:38,821][129210] Adding new argument 'no_render'=True that is not in the saved config file! -[2023-09-12 18:23:38,821][129210] Adding new argument 'save_video'=True that is not in the saved config file! -[2023-09-12 18:23:38,822][129210] Adding new argument 'video_frames'=1000000000.0 that is not in the saved config file! -[2023-09-12 18:23:38,822][129210] Adding new argument 'video_name'=None that is not in the saved config file! -[2023-09-12 18:23:38,824][129210] Adding new argument 'max_num_frames'=1000000000.0 that is not in the saved config file! -[2023-09-12 18:23:38,825][129210] Adding new argument 'max_num_episodes'=10 that is not in the saved config file! -[2023-09-12 18:23:38,825][129210] Adding new argument 'push_to_hub'=False that is not in the saved config file! -[2023-09-12 18:23:38,826][129210] Adding new argument 'hf_repository'=None that is not in the saved config file! -[2023-09-12 18:23:38,827][129210] Adding new argument 'policy_index'=0 that is not in the saved config file! -[2023-09-12 18:23:38,828][129210] Adding new argument 'eval_deterministic'=False that is not in the saved config file! -[2023-09-12 18:23:38,829][129210] Adding new argument 'train_script'=None that is not in the saved config file! -[2023-09-12 18:23:38,830][129210] Adding new argument 'enjoy_script'=None that is not in the saved config file! -[2023-09-12 18:23:38,831][129210] Using frameskip 1 and render_action_repeat=4 for evaluation -[2023-09-12 18:23:38,834][129210] Multi agent env, num agents: 8 -[2023-09-12 18:23:38,879][129210] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 18:23:38,884][129210] RunningMeanStd input shape: (23,) -[2023-09-12 18:23:38,886][129210] RunningMeanStd input shape: (3, 72, 128) -[2023-09-12 18:23:38,887][129210] RunningMeanStd input shape: (1,) -[2023-09-12 18:23:38,907][129210] ConvEncoder: input_channels=3 -[2023-09-12 18:23:39,115][129210] Conv encoder output size: 512 -[2023-09-12 18:23:39,118][129210] Policy head output size: 640 -[2023-09-12 18:23:39,662][130072] Port 40303 is available -[2023-09-12 18:23:39,662][130072] Using port 40303 -[2023-09-12 18:23:39,663][130072] Initializing env for player 0, init_info: {'port': 40303}... -[2023-09-12 18:23:39,694][130072] Using port 40303 on host... -[2023-09-12 18:23:39,714][130072] Initializing env for player 1, init_info: {'port': 40303}... -[2023-09-12 18:23:39,764][130072] Initializing env for player 2, init_info: {'port': 40303}... -[2023-09-12 18:23:39,814][130072] Initializing env for player 3, init_info: {'port': 40303}... -[2023-09-12 18:23:39,879][130072] Initializing env for player 4, init_info: {'port': 40303}... -[2023-09-12 18:23:39,935][130072] Initializing env for player 5, init_info: {'port': 40303}... -[2023-09-12 18:23:39,983][130072] Initializing env for player 6, init_info: {'port': 40303}... -[2023-09-12 18:23:40,075][130072] Initializing env for player 7, init_info: {'port': 40303}... -[2023-09-12 18:23:40,305][129210] No checkpoints found -[2023-09-12 18:23:41,345][130072] Initialized w:0 v:3 player:6 -[2023-09-12 18:23:41,347][130072] Initialized w:0 v:3 player:2 -[2023-09-12 18:23:41,347][130072] Initialized w:0 v:3 player:5 -[2023-09-12 18:23:41,349][130072] Initialized w:0 v:3 player:4 -[2023-09-12 18:23:41,349][130072] Initialized w:0 v:3 player:1 -[2023-09-12 18:23:41,349][130072] Initialized w:0 v:3 player:3 -[2023-09-12 18:23:41,350][130072] Initialized w:0 v:3 player:0 -[2023-09-12 18:23:41,876][130109] Stopping RolloutWorker_w4... -[2023-09-12 18:23:41,876][130109] Loop rollout_proc4_evt_loop terminating... -[2023-09-12 18:23:41,879][130141] Stopping RolloutWorker_w3... -[2023-09-12 18:23:41,880][130141] Loop rollout_proc3_evt_loop terminating... -[2023-09-12 18:23:41,887][130106] Stopping RolloutWorker_w1... -[2023-09-12 18:23:41,888][130106] Loop rollout_proc1_evt_loop terminating... -[2023-09-12 18:23:41,890][130143] Stopping RolloutWorker_w7... -[2023-09-12 18:23:41,890][130143] Loop rollout_proc7_evt_loop terminating... -[2023-09-12 18:23:41,903][130107] Stopping RolloutWorker_w2... -[2023-09-12 18:23:41,904][130107] Loop rollout_proc2_evt_loop terminating... -[2023-09-12 18:23:41,945][130108] Stopping RolloutWorker_w5... -[2023-09-12 18:23:41,945][130108] Loop rollout_proc5_evt_loop terminating... -[2023-09-12 18:23:41,970][130142] Stopping RolloutWorker_w6... -[2023-09-12 18:23:41,971][130142] Loop rollout_proc6_evt_loop terminating... -[2023-09-12 18:23:42,345][130072] Initialized w:0 v:3 player:7 -[2023-09-12 18:23:42,346][130072] 8 agent workers initialized for env 0! -[2023-09-12 18:23:42,394][130072] Decorrelating experience for 96 frames... -[2023-09-12 18:23:46,477][130072] Stopping RolloutWorker_w0... -[2023-09-12 18:23:46,478][130072] Loop rollout_proc0_evt_loop terminating... -[2023-09-12 18:24:12,661][129210] Environment doom_basic already registered, overwriting... -[2023-09-12 18:24:12,664][129210] Environment doom_two_colors_easy already registered, overwriting... -[2023-09-12 18:24:12,665][129210] Environment doom_two_colors_hard already registered, overwriting... -[2023-09-12 18:24:12,666][129210] Environment doom_dm already registered, overwriting... -[2023-09-12 18:24:12,667][129210] Environment doom_dwango5 already registered, overwriting... -[2023-09-12 18:24:12,668][129210] Environment doom_my_way_home_flat_actions already registered, overwriting... -[2023-09-12 18:24:12,669][129210] Environment doom_defend_the_center_flat_actions already registered, overwriting... -[2023-09-12 18:24:12,670][129210] Environment doom_my_way_home already registered, overwriting... -[2023-09-12 18:24:12,673][129210] Environment doom_deadly_corridor already registered, overwriting... -[2023-09-12 18:24:12,674][129210] Environment doom_defend_the_center already registered, overwriting... -[2023-09-12 18:24:12,675][129210] Environment doom_defend_the_line already registered, overwriting... -[2023-09-12 18:24:12,676][129210] Environment doom_health_gathering already registered, overwriting... -[2023-09-12 18:24:12,677][129210] Environment doom_health_gathering_supreme already registered, overwriting... -[2023-09-12 18:24:12,678][129210] Environment doom_battle already registered, overwriting... -[2023-09-12 18:24:12,679][129210] Environment doom_battle2 already registered, overwriting... -[2023-09-12 18:24:12,680][129210] Environment doom_duel_bots already registered, overwriting... -[2023-09-12 18:24:12,681][129210] Environment doom_deathmatch_bots already registered, overwriting... -[2023-09-12 18:24:12,681][129210] Environment doom_duel already registered, overwriting... -[2023-09-12 18:24:12,682][129210] Environment doom_deathmatch_full already registered, overwriting... -[2023-09-12 18:24:12,683][129210] Environment doom_benchmark already registered, overwriting... -[2023-09-12 18:24:12,684][129210] register_encoder_factory: -[2023-09-12 18:24:12,706][129210] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json -[2023-09-12 18:24:12,707][129210] Overriding arg 'env' with value 'doom_dwango5' passed from command line -[2023-09-12 18:24:12,712][129210] Experiment dir /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment already exists! -[2023-09-12 18:24:12,713][129210] Resuming existing experiment from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment... -[2023-09-12 18:24:12,713][129210] Weights and Biases integration disabled -[2023-09-12 18:24:12,716][129210] Environment var CUDA_VISIBLE_DEVICES is 0,1 - -[2023-09-12 18:24:14,817][129210] Starting experiment with the following configuration: -help=False -algo=APPO -env=doom_dwango5 -experiment=default_experiment -train_dir=/home/cogstack/Documents/optuna/environments/sample_factory/train_dir -restart_behavior=resume -device=gpu -seed=None -num_policies=1 -async_rl=True -serial_mode=False -batched_sampling=False -num_batches_to_accumulate=2 -worker_num_splits=2 -policy_workers_per_policy=1 -max_policy_lag=1000 -num_workers=8 -num_envs_per_worker=4 -batch_size=1024 -num_batches_per_epoch=1 -num_epochs=1 -rollout=32 -recurrence=32 -shuffle_minibatches=False -gamma=0.99 -reward_scale=1.0 -reward_clip=1000.0 -value_bootstrap=False -normalize_returns=True -exploration_loss_coeff=0.001 -value_loss_coeff=0.5 -kl_loss_coeff=0.0 -exploration_loss=symmetric_kl -gae_lambda=0.95 -ppo_clip_ratio=0.1 -ppo_clip_value=0.2 -with_vtrace=False -vtrace_rho=1.0 -vtrace_c=1.0 -optimizer=adam -adam_eps=1e-06 -adam_beta1=0.9 -adam_beta2=0.999 -max_grad_norm=4.0 -learning_rate=0.0001 -lr_schedule=constant -lr_schedule_kl_threshold=0.008 -lr_adaptive_min=1e-06 -lr_adaptive_max=0.01 -obs_subtract_mean=0.0 -obs_scale=255.0 -normalize_input=True -normalize_input_keys=None -decorrelate_experience_max_seconds=0 -decorrelate_envs_on_one_worker=True -actor_worker_gpus=[] -set_workers_cpu_affinity=True -force_envs_single_thread=False -default_niceness=0 -log_to_file=True -experiment_summaries_interval=10 -flush_summaries_interval=30 -stats_avg=100 -summaries_use_frameskip=True -heartbeat_interval=20 -heartbeat_reporting_interval=600 -train_for_env_steps=20000000 -train_for_seconds=10000000000 -save_every_sec=120 -keep_checkpoints=2 -load_checkpoint_kind=latest -save_milestones_sec=-1 -save_best_every_sec=5 -save_best_metric=reward -save_best_after=100000 -benchmark=False -encoder_mlp_layers=[512, 512] -encoder_conv_architecture=convnet_simple -encoder_conv_mlp_layers=[512] -use_rnn=True -rnn_size=512 -rnn_type=gru -rnn_num_layers=1 -decoder_mlp_layers=[] -nonlinearity=elu -policy_initialization=orthogonal -policy_init_gain=1.0 -actor_critic_share_weights=True -adaptive_stddev=True -continuous_tanh_scale=0.0 -initial_stddev=1.0 -use_env_info_cache=False -env_gpu_actions=False -env_gpu_observations=True -env_frameskip=4 -env_framestack=1 -pixel_format=CHW -use_record_episode_statistics=False -with_wandb=False -wandb_user=None -wandb_project=sample_factory -wandb_group=None -wandb_job_type=SF -wandb_tags=[] -with_pbt=False -pbt_mix_policies_in_one_env=True -pbt_period_env_steps=5000000 -pbt_start_mutation=20000000 -pbt_replace_fraction=0.3 -pbt_mutation_rate=0.15 -pbt_replace_reward_gap=0.1 -pbt_replace_reward_gap_absolute=1e-06 -pbt_optimize_gamma=False -pbt_target_objective=true_objective -pbt_perturb_min=1.1 -pbt_perturb_max=1.5 -num_agents=-1 -num_humans=0 -num_bots=-1 -start_bot_difficulty=None -timelimit=None -res_w=128 -res_h=72 -wide_aspect_ratio=False -eval_env_frameskip=1 -fps=35 -command_line=--env=doom_dm --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=20000000 -cli_args={'env': 'doom_dm', 'num_workers': 8, 'num_envs_per_worker': 4, 'train_for_env_steps': 20000000} -git_hash=20b6d44612dad7d171f23e13b1f3b4c5e5631cf9 -git_repo_name=https://github.com/MattStammers/optuna.git -[2023-09-12 18:24:14,820][129210] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json... -[2023-09-12 18:24:15,827][129210] Rollout worker 0 uses device cpu -[2023-09-12 18:24:15,829][129210] Rollout worker 1 uses device cpu -[2023-09-12 18:24:15,830][129210] Rollout worker 2 uses device cpu -[2023-09-12 18:24:15,832][129210] Rollout worker 3 uses device cpu -[2023-09-12 18:24:15,834][129210] Rollout worker 4 uses device cpu -[2023-09-12 18:24:15,836][129210] Rollout worker 5 uses device cpu -[2023-09-12 18:24:15,837][129210] Rollout worker 6 uses device cpu -[2023-09-12 18:24:15,839][129210] Rollout worker 7 uses device cpu -[2023-09-12 18:24:16,016][129210] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 18:24:16,017][129210] InferenceWorker_p0-w0: min num requests: 2 -[2023-09-12 18:24:16,051][129210] Starting all processes... -[2023-09-12 18:24:16,052][129210] Starting process learner_proc0 -[2023-09-12 18:24:17,682][129210] Starting all processes... -[2023-09-12 18:24:17,684][09685] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 18:24:17,684][09685] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 -[2023-09-12 18:24:17,689][129210] Starting process inference_proc0-0 -[2023-09-12 18:24:17,689][129210] Starting process rollout_proc0 -[2023-09-12 18:24:17,690][129210] Starting process rollout_proc1 -[2023-09-12 18:24:17,690][129210] Starting process rollout_proc2 -[2023-09-12 18:24:17,691][129210] Starting process rollout_proc3 -[2023-09-12 18:24:17,691][129210] Starting process rollout_proc4 -[2023-09-12 18:24:17,692][129210] Starting process rollout_proc5 -[2023-09-12 18:24:17,725][09685] Num visible devices: 1 -[2023-09-12 18:24:17,692][129210] Starting process rollout_proc6 -[2023-09-12 18:24:17,693][129210] Starting process rollout_proc7 -[2023-09-12 18:24:17,774][09685] Starting seed is not provided -[2023-09-12 18:24:17,774][09685] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 18:24:17,774][09685] Initializing actor-critic model on device cuda:0 -[2023-09-12 18:24:17,775][09685] RunningMeanStd input shape: (23,) -[2023-09-12 18:24:17,775][09685] RunningMeanStd input shape: (3, 72, 128) -[2023-09-12 18:24:17,777][09685] RunningMeanStd input shape: (1,) -[2023-09-12 18:24:17,807][09685] ConvEncoder: input_channels=3 -[2023-09-12 18:24:18,010][09685] Conv encoder output size: 512 -[2023-09-12 18:24:18,011][09685] Policy head output size: 640 -[2023-09-12 18:24:18,040][09685] Created Actor Critic model with architecture: -[2023-09-12 18:24:18,040][09685] ActorCriticSharedWeights( +[2023-09-14 14:36:32,540][63454] Using optimizer +[2023-09-14 14:36:32,541][63454] No checkpoints found +[2023-09-14 14:36:32,541][63454] Did not load from checkpoint, starting from scratch! +[2023-09-14 14:36:32,541][63454] Initialized policy 0 weights for model version 0 +[2023-09-14 14:36:32,543][63454] LearnerWorker_p0 finished initialization! +[2023-09-14 14:36:32,543][63454] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 14:36:33,026][63576] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-09-14 14:36:33,026][63576] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for learning process 1 +[2023-09-14 14:36:33,064][63576] Num visible devices: 1 +[2023-09-14 14:36:33,107][63576] Starting seed is not provided +[2023-09-14 14:36:33,108][63576] Using GPUs [0] for process 1 (actually maps to GPUs [1]) +[2023-09-14 14:36:33,108][63576] Initializing actor-critic model on device cuda:0 +[2023-09-14 14:36:33,108][63576] RunningMeanStd input shape: (23,) +[2023-09-14 14:36:33,109][63576] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 14:36:33,109][63576] RunningMeanStd input shape: (1,) +[2023-09-14 14:36:33,130][63576] ConvEncoder: input_channels=3 +[2023-09-14 14:36:33,386][63576] Conv encoder output size: 512 +[2023-09-14 14:36:33,387][63576] Policy head output size: 640 +[2023-09-14 14:36:33,417][63576] Created Actor Critic model with architecture: +[2023-09-14 14:36:33,418][63576] ActorCriticSharedWeights( (obs_normalizer): ObservationNormalizer( (running_mean_std): RunningMeanStdDictInPlace( (running_mean_std): ModuleDict( @@ -1182,4962 +123,5341 @@ git_repo_name=https://github.com/MattStammers/optuna.git ) (critic_linear): Linear(in_features=512, out_features=1, bias=True) (action_parameterization): ActionParameterizationDefault( - (distribution_linear): Linear(in_features=512, out_features=15, bias=True) + (distribution_linear): Linear(in_features=512, out_features=39, bias=True) ) ) -[2023-09-12 18:24:19,420][09685] Using optimizer -[2023-09-12 18:24:19,421][09685] No checkpoints found -[2023-09-12 18:24:19,421][09685] Did not load from checkpoint, starting from scratch! -[2023-09-12 18:24:19,421][09685] Initialized policy 0 weights for model version 0 -[2023-09-12 18:24:19,423][09685] LearnerWorker_p0 finished initialization! -[2023-09-12 18:24:19,423][09685] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 18:24:19,746][09915] Worker 6 uses CPU cores [24, 25, 26, 27] -[2023-09-12 18:24:19,760][09823] Worker 2 uses CPU cores [8, 9, 10, 11] -[2023-09-12 18:24:19,771][09914] Worker 7 uses CPU cores [28, 29, 30, 31] -[2023-09-12 18:24:19,789][09855] Worker 4 uses CPU cores [16, 17, 18, 19] -[2023-09-12 18:24:19,831][09822] Worker 1 uses CPU cores [4, 5, 6, 7] -[2023-09-12 18:24:19,909][09860] Worker 3 uses CPU cores [12, 13, 14, 15] -[2023-09-12 18:24:19,938][09820] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 18:24:19,938][09820] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 -[2023-09-12 18:24:19,947][09821] Worker 0 uses CPU cores [0, 1, 2, 3] -[2023-09-12 18:24:19,959][09820] Num visible devices: 1 -[2023-09-12 18:24:20,137][09916] Worker 5 uses CPU cores [20, 21, 22, 23] -[2023-09-12 18:24:20,138][129210] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 0. Throughput: 0: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:24:20,648][09820] RunningMeanStd input shape: (23,) -[2023-09-12 18:24:20,648][09820] RunningMeanStd input shape: (3, 72, 128) -[2023-09-12 18:24:20,648][09820] RunningMeanStd input shape: (1,) -[2023-09-12 18:24:20,660][09820] ConvEncoder: input_channels=3 -[2023-09-12 18:24:20,760][09820] Conv encoder output size: 512 -[2023-09-12 18:24:20,761][09820] Policy head output size: 640 -[2023-09-12 18:24:21,105][129210] Inference worker 0-0 is ready! -[2023-09-12 18:24:21,107][129210] All inference workers are ready! Signal rollout workers to start! -[2023-09-12 18:24:21,111][09860] Multi agent env, num agents: 8 -[2023-09-12 18:24:21,112][09914] Multi agent env, num agents: 8 -[2023-09-12 18:24:21,112][09822] Multi agent env, num agents: 8 -[2023-09-12 18:24:21,113][09916] Multi agent env, num agents: 8 -[2023-09-12 18:24:21,114][09855] Multi agent env, num agents: 8 -[2023-09-12 18:24:21,114][09821] Multi agent env, num agents: 8 -[2023-09-12 18:24:21,114][09823] Multi agent env, num agents: 8 -[2023-09-12 18:24:21,114][09915] Multi agent env, num agents: 8 -[2023-09-12 18:24:21,143][09860] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 18:24:21,147][09860] Multi agent env, num agents: 8 -[2023-09-12 18:24:21,147][09914] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 18:24:21,148][09822] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 18:24:21,151][09916] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 18:24:21,152][09914] Multi agent env, num agents: 8 -[2023-09-12 18:24:21,153][09822] Multi agent env, num agents: 8 -[2023-09-12 18:24:21,156][09916] Multi agent env, num agents: 8 -[2023-09-12 18:24:21,166][09823] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 18:24:21,166][09915] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 18:24:21,166][09855] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 18:24:21,166][09821] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 18:24:21,172][09823] Multi agent env, num agents: 8 -[2023-09-12 18:24:21,172][09915] Multi agent env, num agents: 8 -[2023-09-12 18:24:21,172][09821] Multi agent env, num agents: 8 -[2023-09-12 18:24:21,172][09855] Multi agent env, num agents: 8 -[2023-09-12 18:24:21,204][09916] Port 40800 is available -[2023-09-12 18:24:21,204][09822] Port 40400 is available -[2023-09-12 18:24:21,204][09916] Using port 40800 -[2023-09-12 18:24:21,204][09822] Using port 40400 -[2023-09-12 18:24:21,204][09914] Port 41000 is available -[2023-09-12 18:24:21,205][09914] Using port 41000 -[2023-09-12 18:24:21,205][09916] Initializing env for player 0, init_info: {'port': 40800}... -[2023-09-12 18:24:21,205][09822] Initializing env for player 0, init_info: {'port': 40400}... -[2023-09-12 18:24:21,206][09914] Initializing env for player 0, init_info: {'port': 41000}... -[2023-09-12 18:24:21,223][09821] Port 40300 is available -[2023-09-12 18:24:21,223][09821] Using port 40300 -[2023-09-12 18:24:21,223][09823] Port 40500 is available -[2023-09-12 18:24:21,223][09823] Using port 40500 -[2023-09-12 18:24:21,223][09855] Port 40700 is available -[2023-09-12 18:24:21,223][09855] Using port 40700 -[2023-09-12 18:24:21,224][09823] Initializing env for player 0, init_info: {'port': 40500}... -[2023-09-12 18:24:21,224][09821] Initializing env for player 0, init_info: {'port': 40300}... -[2023-09-12 18:24:21,224][09915] Port 40900 is available -[2023-09-12 18:24:21,224][09915] Using port 40900 -[2023-09-12 18:24:21,224][09855] Initializing env for player 0, init_info: {'port': 40700}... -[2023-09-12 18:24:21,225][09915] Initializing env for player 0, init_info: {'port': 40900}... -[2023-09-12 18:24:21,236][09822] Using port 40400 on host... -[2023-09-12 18:24:21,238][09916] Using port 40800 on host... -[2023-09-12 18:24:21,251][09914] Using port 41000 on host... -[2023-09-12 18:24:21,254][09855] Using port 40700 on host... -[2023-09-12 18:24:21,256][09916] Initializing env for player 1, init_info: {'port': 40800}... -[2023-09-12 18:24:21,256][09822] Initializing env for player 1, init_info: {'port': 40400}... -[2023-09-12 18:24:21,259][09860] Port 40600 is available -[2023-09-12 18:24:21,259][09860] Using port 40600 -[2023-09-12 18:24:21,259][09914] Initializing env for player 1, init_info: {'port': 41000}... -[2023-09-12 18:24:21,260][09821] Using port 40300 on host... -[2023-09-12 18:24:21,260][09860] Initializing env for player 0, init_info: {'port': 40600}... -[2023-09-12 18:24:21,273][09823] Using port 40500 on host... -[2023-09-12 18:24:21,274][09915] Using port 40900 on host... -[2023-09-12 18:24:21,275][09855] Initializing env for player 1, init_info: {'port': 40700}... -[2023-09-12 18:24:21,276][09821] Initializing env for player 1, init_info: {'port': 40300}... -[2023-09-12 18:24:21,275][09915] Initializing env for player 1, init_info: {'port': 40900}... -[2023-09-12 18:24:21,283][09823] Initializing env for player 1, init_info: {'port': 40500}... -[2023-09-12 18:24:21,292][09860] Using port 40600 on host... -[2023-09-12 18:24:21,306][09916] Initializing env for player 2, init_info: {'port': 40800}... -[2023-09-12 18:24:21,309][09822] Initializing env for player 2, init_info: {'port': 40400}... -[2023-09-12 18:24:21,310][09914] Initializing env for player 2, init_info: {'port': 41000}... -[2023-09-12 18:24:21,311][09860] Initializing env for player 1, init_info: {'port': 40600}... -[2023-09-12 18:24:21,325][09823] Initializing env for player 2, init_info: {'port': 40500}... -[2023-09-12 18:24:21,325][09855] Initializing env for player 2, init_info: {'port': 40700}... -[2023-09-12 18:24:21,326][09915] Initializing env for player 2, init_info: {'port': 40900}... -[2023-09-12 18:24:21,326][09821] Initializing env for player 2, init_info: {'port': 40300}... -[2023-09-12 18:24:21,359][09916] Initializing env for player 3, init_info: {'port': 40800}... -[2023-09-12 18:24:21,361][09860] Initializing env for player 2, init_info: {'port': 40600}... -[2023-09-12 18:24:21,361][09914] Initializing env for player 3, init_info: {'port': 41000}... -[2023-09-12 18:24:21,363][09822] Initializing env for player 3, init_info: {'port': 40400}... -[2023-09-12 18:24:21,375][09823] Initializing env for player 3, init_info: {'port': 40500}... -[2023-09-12 18:24:21,376][09915] Initializing env for player 3, init_info: {'port': 40900}... -[2023-09-12 18:24:21,379][09855] Initializing env for player 3, init_info: {'port': 40700}... -[2023-09-12 18:24:21,379][09821] Initializing env for player 3, init_info: {'port': 40300}... -[2023-09-12 18:24:21,411][09914] Initializing env for player 4, init_info: {'port': 41000}... -[2023-09-12 18:24:21,411][09822] Initializing env for player 4, init_info: {'port': 40400}... -[2023-09-12 18:24:21,415][09860] Initializing env for player 3, init_info: {'port': 40600}... -[2023-09-12 18:24:21,421][09916] Initializing env for player 4, init_info: {'port': 40800}... -[2023-09-12 18:24:21,426][09823] Initializing env for player 4, init_info: {'port': 40500}... -[2023-09-12 18:24:21,431][09855] Initializing env for player 4, init_info: {'port': 40700}... -[2023-09-12 18:24:21,435][09821] Initializing env for player 4, init_info: {'port': 40300}... -[2023-09-12 18:24:21,434][09915] Initializing env for player 4, init_info: {'port': 40900}... -[2023-09-12 18:24:21,467][09860] Initializing env for player 4, init_info: {'port': 40600}... -[2023-09-12 18:24:21,467][09914] Initializing env for player 5, init_info: {'port': 41000}... -[2023-09-12 18:24:21,480][09823] Initializing env for player 5, init_info: {'port': 40500}... -[2023-09-12 18:24:21,481][09855] Initializing env for player 5, init_info: {'port': 40700}... -[2023-09-12 18:24:21,476][09822] Initializing env for player 5, init_info: {'port': 40400}... -[2023-09-12 18:24:21,486][09821] Initializing env for player 5, init_info: {'port': 40300}... -[2023-09-12 18:24:21,492][09915] Initializing env for player 5, init_info: {'port': 40900}... -[2023-09-12 18:24:21,497][09916] Initializing env for player 5, init_info: {'port': 40800}... -[2023-09-12 18:24:21,518][09914] Initializing env for player 6, init_info: {'port': 41000}... -[2023-09-12 18:24:21,525][09860] Initializing env for player 5, init_info: {'port': 40600}... -[2023-09-12 18:24:21,526][09822] Initializing env for player 6, init_info: {'port': 40400}... -[2023-09-12 18:24:21,528][09823] Initializing env for player 6, init_info: {'port': 40500}... -[2023-09-12 18:24:21,532][09855] Initializing env for player 6, init_info: {'port': 40700}... -[2023-09-12 18:24:21,539][09821] Initializing env for player 6, init_info: {'port': 40300}... -[2023-09-12 18:24:21,551][09916] Initializing env for player 6, init_info: {'port': 40800}... -[2023-09-12 18:24:21,542][09915] Initializing env for player 6, init_info: {'port': 40900}... -[2023-09-12 18:24:21,579][09822] Initializing env for player 7, init_info: {'port': 40400}... -[2023-09-12 18:24:21,579][09860] Initializing env for player 6, init_info: {'port': 40600}... -[2023-09-12 18:24:21,582][09823] Initializing env for player 7, init_info: {'port': 40500}... -[2023-09-12 18:24:21,588][09821] Initializing env for player 7, init_info: {'port': 40300}... -[2023-09-12 18:24:21,593][09915] Initializing env for player 7, init_info: {'port': 40900}... -[2023-09-12 18:24:21,595][09855] Initializing env for player 7, init_info: {'port': 40700}... -[2023-09-12 18:24:21,596][09914] Initializing env for player 7, init_info: {'port': 41000}... -[2023-09-12 18:24:21,607][09916] Initializing env for player 7, init_info: {'port': 40800}... -[2023-09-12 18:24:21,651][09860] Initializing env for player 7, init_info: {'port': 40600}... -[2023-09-12 18:24:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:24:23,206][09915] Initialized w:6 v:0 player:7 -[2023-09-12 18:24:23,209][09915] Initialized w:6 v:0 player:3 -[2023-09-12 18:24:23,209][09915] Initialized w:6 v:0 player:1 -[2023-09-12 18:24:23,210][09915] Initialized w:6 v:0 player:2 -[2023-09-12 18:24:23,210][09915] Initialized w:6 v:0 player:5 -[2023-09-12 18:24:23,210][09915] Initialized w:6 v:0 player:0 -[2023-09-12 18:24:23,211][09915] Initialized w:6 v:0 player:6 -[2023-09-12 18:24:23,212][09915] Initialized w:6 v:0 player:4 -[2023-09-12 18:24:23,213][09915] 8 agent workers initialized for env 6! -[2023-09-12 18:24:23,234][09823] Initialized w:2 v:0 player:0 -[2023-09-12 18:24:23,235][09823] Initialized w:2 v:0 player:6 -[2023-09-12 18:24:23,236][09823] Initialized w:2 v:0 player:4 -[2023-09-12 18:24:23,237][09823] Initialized w:2 v:0 player:1 -[2023-09-12 18:24:23,237][09823] Initialized w:2 v:0 player:7 -[2023-09-12 18:24:23,238][09823] Initialized w:2 v:0 player:5 -[2023-09-12 18:24:23,238][09823] Initialized w:2 v:0 player:2 -[2023-09-12 18:24:23,238][09823] Initialized w:2 v:0 player:3 -[2023-09-12 18:24:23,241][09823] 8 agent workers initialized for env 2! -[2023-09-12 18:24:23,259][09821] Initialized w:0 v:0 player:0 -[2023-09-12 18:24:23,262][09821] Initialized w:0 v:0 player:4 -[2023-09-12 18:24:23,263][09821] Initialized w:0 v:0 player:3 -[2023-09-12 18:24:23,263][09821] Initialized w:0 v:0 player:2 -[2023-09-12 18:24:23,263][09821] Initialized w:0 v:0 player:1 -[2023-09-12 18:24:23,263][09821] Initialized w:0 v:0 player:7 -[2023-09-12 18:24:23,263][09821] Initialized w:0 v:0 player:6 -[2023-09-12 18:24:23,264][09821] Initialized w:0 v:0 player:5 -[2023-09-12 18:24:23,266][09915] Decorrelating experience for 0 frames... -[2023-09-12 18:24:23,267][09821] 8 agent workers initialized for env 0! -[2023-09-12 18:24:23,268][09915] Port 40901 is available -[2023-09-12 18:24:23,268][09915] Using port 40901 -[2023-09-12 18:24:23,271][09822] Initialized w:1 v:0 player:4 -[2023-09-12 18:24:23,272][09822] Initialized w:1 v:0 player:2 -[2023-09-12 18:24:23,272][09822] Initialized w:1 v:0 player:5 -[2023-09-12 18:24:23,273][09822] Initialized w:1 v:0 player:3 -[2023-09-12 18:24:23,274][09822] Initialized w:1 v:0 player:1 -[2023-09-12 18:24:23,274][09822] Initialized w:1 v:0 player:6 -[2023-09-12 18:24:23,274][09822] Initialized w:1 v:0 player:7 -[2023-09-12 18:24:23,275][09822] Initialized w:1 v:0 player:0 -[2023-09-12 18:24:23,276][09822] 8 agent workers initialized for env 1! -[2023-09-12 18:24:23,277][09916] Initialized w:5 v:0 player:5 -[2023-09-12 18:24:23,280][09916] Initialized w:5 v:0 player:4 -[2023-09-12 18:24:23,281][09916] Initialized w:5 v:0 player:3 -[2023-09-12 18:24:23,281][09916] Initialized w:5 v:0 player:6 -[2023-09-12 18:24:23,281][09916] Initialized w:5 v:0 player:0 -[2023-09-12 18:24:23,282][09916] Initialized w:5 v:0 player:2 -[2023-09-12 18:24:23,287][09916] Initialized w:5 v:0 player:7 -[2023-09-12 18:24:23,296][09823] Decorrelating experience for 0 frames... -[2023-09-12 18:24:23,297][09823] Port 40501 is available -[2023-09-12 18:24:23,297][09823] Using port 40501 -[2023-09-12 18:24:23,298][09823] Initializing env for player 0, init_info: {'port': 40501}... -[2023-09-12 18:24:23,307][09855] Initialized w:4 v:0 player:3 -[2023-09-12 18:24:23,310][09855] Initialized w:4 v:0 player:5 -[2023-09-12 18:24:23,310][09855] Initialized w:4 v:0 player:0 -[2023-09-12 18:24:23,311][09855] Initialized w:4 v:0 player:4 -[2023-09-12 18:24:23,312][09855] Initialized w:4 v:0 player:7 -[2023-09-12 18:24:23,312][09855] Initialized w:4 v:0 player:6 -[2023-09-12 18:24:23,312][09855] Initialized w:4 v:0 player:2 -[2023-09-12 18:24:23,312][09855] Initialized w:4 v:0 player:1 -[2023-09-12 18:24:23,315][09855] 8 agent workers initialized for env 4! -[2023-09-12 18:24:23,316][09822] Decorrelating experience for 0 frames... -[2023-09-12 18:24:23,317][09822] Port 40401 is available -[2023-09-12 18:24:23,317][09822] Using port 40401 -[2023-09-12 18:24:23,318][09822] Initializing env for player 0, init_info: {'port': 40401}... -[2023-09-12 18:24:23,320][09821] Decorrelating experience for 0 frames... -[2023-09-12 18:24:23,322][09821] Port 40301 is available -[2023-09-12 18:24:23,323][09821] Using port 40301 -[2023-09-12 18:24:23,323][09821] Initializing env for player 0, init_info: {'port': 40301}... -[2023-09-12 18:24:23,327][09823] Using port 40501 on host... -[2023-09-12 18:24:23,346][09822] Using port 40401 on host... -[2023-09-12 18:24:23,348][09823] Initializing env for player 1, init_info: {'port': 40501}... -[2023-09-12 18:24:23,366][09821] Using port 40301 on host... -[2023-09-12 18:24:23,368][09822] Initializing env for player 1, init_info: {'port': 40401}... -[2023-09-12 18:24:23,376][09855] Decorrelating experience for 0 frames... -[2023-09-12 18:24:23,376][09821] Initializing env for player 1, init_info: {'port': 40301}... -[2023-09-12 18:24:23,377][09855] Port 40701 is available -[2023-09-12 18:24:23,378][09855] Using port 40701 -[2023-09-12 18:24:23,399][09823] Initializing env for player 2, init_info: {'port': 40501}... -[2023-09-12 18:24:23,419][09822] Initializing env for player 2, init_info: {'port': 40401}... -[2023-09-12 18:24:23,426][09821] Initializing env for player 2, init_info: {'port': 40301}... -[2023-09-12 18:24:23,434][09860] Initialized w:3 v:0 player:4 -[2023-09-12 18:24:23,435][09860] Initialized w:3 v:0 player:6 -[2023-09-12 18:24:23,436][09860] Initialized w:3 v:0 player:7 -[2023-09-12 18:24:23,436][09860] Initialized w:3 v:0 player:3 -[2023-09-12 18:24:23,437][09860] Initialized w:3 v:0 player:1 -[2023-09-12 18:24:23,437][09860] Initialized w:3 v:0 player:0 -[2023-09-12 18:24:23,438][09860] Initialized w:3 v:0 player:5 -[2023-09-12 18:24:23,439][09860] Initialized w:3 v:0 player:2 -[2023-09-12 18:24:23,440][09860] 8 agent workers initialized for env 3! -[2023-09-12 18:24:23,455][09823] Initializing env for player 3, init_info: {'port': 40501}... -[2023-09-12 18:24:23,469][09822] Initializing env for player 3, init_info: {'port': 40401}... -[2023-09-12 18:24:23,479][09821] Initializing env for player 3, init_info: {'port': 40301}... -[2023-09-12 18:24:23,494][09860] Decorrelating experience for 0 frames... -[2023-09-12 18:24:23,496][09860] Port 40601 is available -[2023-09-12 18:24:23,496][09860] Using port 40601 -[2023-09-12 18:24:23,497][09860] Initializing env for player 0, init_info: {'port': 40601}... -[2023-09-12 18:24:23,507][09823] Initializing env for player 4, init_info: {'port': 40501}... -[2023-09-12 18:24:23,531][09821] Initializing env for player 4, init_info: {'port': 40301}... -[2023-09-12 18:24:23,539][09822] Initializing env for player 4, init_info: {'port': 40401}... -[2023-09-12 18:24:23,542][09860] Using port 40601 on host... -[2023-09-12 18:24:23,551][09860] Initializing env for player 1, init_info: {'port': 40601}... -[2023-09-12 18:24:23,555][09823] Initializing env for player 5, init_info: {'port': 40501}... -[2023-09-12 18:24:23,567][09914] Initialized w:7 v:0 player:0 -[2023-09-12 18:24:23,569][09914] Initialized w:7 v:0 player:6 -[2023-09-12 18:24:23,570][09914] Initialized w:7 v:0 player:4 -[2023-09-12 18:24:23,571][09914] Initialized w:7 v:0 player:2 -[2023-09-12 18:24:23,571][09914] Initialized w:7 v:0 player:5 -[2023-09-12 18:24:23,571][09914] Initialized w:7 v:0 player:1 -[2023-09-12 18:24:23,571][09914] Initialized w:7 v:0 player:7 -[2023-09-12 18:24:23,572][09914] Initialized w:7 v:0 player:3 -[2023-09-12 18:24:23,574][09914] 8 agent workers initialized for env 7! -[2023-09-12 18:24:23,589][09821] Initializing env for player 5, init_info: {'port': 40301}... -[2023-09-12 18:24:23,595][09822] Initializing env for player 5, init_info: {'port': 40401}... -[2023-09-12 18:24:23,601][09860] Initializing env for player 2, init_info: {'port': 40601}... -[2023-09-12 18:24:23,607][09823] Initializing env for player 6, init_info: {'port': 40501}... -[2023-09-12 18:24:23,635][09914] Decorrelating experience for 0 frames... -[2023-09-12 18:24:23,637][09914] Port 41001 is available -[2023-09-12 18:24:23,637][09914] Using port 41001 -[2023-09-12 18:24:23,638][09914] Initializing env for player 0, init_info: {'port': 41001}... -[2023-09-12 18:24:23,643][09821] Initializing env for player 6, init_info: {'port': 40301}... -[2023-09-12 18:24:23,647][09822] Initializing env for player 6, init_info: {'port': 40401}... -[2023-09-12 18:24:23,655][09860] Initializing env for player 3, init_info: {'port': 40601}... -[2023-09-12 18:24:23,663][09823] Initializing env for player 7, init_info: {'port': 40501}... -[2023-09-12 18:24:23,684][09914] Using port 41001 on host... -[2023-09-12 18:24:23,693][09914] Initializing env for player 1, init_info: {'port': 41001}... -[2023-09-12 18:24:23,693][09821] Initializing env for player 7, init_info: {'port': 40301}... -[2023-09-12 18:24:23,707][09822] Initializing env for player 7, init_info: {'port': 40401}... -[2023-09-12 18:24:23,711][09860] Initializing env for player 4, init_info: {'port': 40601}... -[2023-09-12 18:24:23,747][09914] Initializing env for player 2, init_info: {'port': 41001}... -[2023-09-12 18:24:23,759][09860] Initializing env for player 5, init_info: {'port': 40601}... -[2023-09-12 18:24:23,798][09914] Initializing env for player 3, init_info: {'port': 41001}... -[2023-09-12 18:24:23,811][09860] Initializing env for player 6, init_info: {'port': 40601}... -[2023-09-12 18:24:23,859][09914] Initializing env for player 4, init_info: {'port': 41001}... -[2023-09-12 18:24:23,875][09860] Initializing env for player 7, init_info: {'port': 40601}... -[2023-09-12 18:24:23,919][09914] Initializing env for player 5, init_info: {'port': 41001}... -[2023-09-12 18:24:23,971][09914] Initializing env for player 6, init_info: {'port': 41001}... -[2023-09-12 18:24:24,023][09914] Initializing env for player 7, init_info: {'port': 41001}... -[2023-09-12 18:24:24,277][09916] Initialized w:5 v:0 player:1 -[2023-09-12 18:24:24,279][09916] 8 agent workers initialized for env 5! -[2023-09-12 18:24:24,296][09855] Initializing env for player 0, init_info: {'port': 40701}... -[2023-09-12 18:24:24,331][09855] Using port 40701 on host... -[2023-09-12 18:24:24,346][09855] Initializing env for player 1, init_info: {'port': 40701}... -[2023-09-12 18:24:24,367][09916] Decorrelating experience for 0 frames... -[2023-09-12 18:24:24,369][09916] Port 40801 is available -[2023-09-12 18:24:24,369][09916] Using port 40801 -[2023-09-12 18:24:24,370][09916] Initializing env for player 0, init_info: {'port': 40801}... -[2023-09-12 18:24:24,397][09855] Initializing env for player 2, init_info: {'port': 40701}... -[2023-09-12 18:24:24,399][09916] Using port 40801 on host... -[2023-09-12 18:24:24,420][09916] Initializing env for player 1, init_info: {'port': 40801}... -[2023-09-12 18:24:24,447][09855] Initializing env for player 3, init_info: {'port': 40701}... -[2023-09-12 18:24:24,471][09916] Initializing env for player 2, init_info: {'port': 40801}... -[2023-09-12 18:24:24,499][09855] Initializing env for player 4, init_info: {'port': 40701}... -[2023-09-12 18:24:24,527][09916] Initializing env for player 3, init_info: {'port': 40801}... -[2023-09-12 18:24:24,551][09855] Initializing env for player 5, init_info: {'port': 40701}... -[2023-09-12 18:24:24,579][09916] Initializing env for player 4, init_info: {'port': 40801}... -[2023-09-12 18:24:24,607][09855] Initializing env for player 6, init_info: {'port': 40701}... -[2023-09-12 18:24:24,634][09916] Initializing env for player 5, init_info: {'port': 40801}... -[2023-09-12 18:24:24,659][09855] Initializing env for player 7, init_info: {'port': 40701}... -[2023-09-12 18:24:24,687][09916] Initializing env for player 6, init_info: {'port': 40801}... -[2023-09-12 18:24:24,743][09916] Initializing env for player 7, init_info: {'port': 40801}... -[2023-09-12 18:24:24,922][09823] Initialized w:2 v:1 player:6 -[2023-09-12 18:24:24,924][09823] Initialized w:2 v:1 player:7 -[2023-09-12 18:24:24,925][09823] Initialized w:2 v:1 player:5 -[2023-09-12 18:24:24,925][09823] Initialized w:2 v:1 player:2 -[2023-09-12 18:24:24,926][09823] Initialized w:2 v:1 player:4 -[2023-09-12 18:24:24,925][09823] Initialized w:2 v:1 player:0 -[2023-09-12 18:24:24,928][09823] Initialized w:2 v:1 player:3 -[2023-09-12 18:24:24,929][09823] Initialized w:2 v:1 player:1 -[2023-09-12 18:24:24,930][09823] 8 agent workers initialized for env 2! -[2023-09-12 18:24:24,960][09821] Initialized w:0 v:1 player:5 -[2023-09-12 18:24:24,961][09821] Initialized w:0 v:1 player:7 -[2023-09-12 18:24:24,963][09821] Initialized w:0 v:1 player:1 -[2023-09-12 18:24:24,963][09821] Initialized w:0 v:1 player:4 -[2023-09-12 18:24:24,963][09821] Initialized w:0 v:1 player:6 -[2023-09-12 18:24:24,964][09821] Initialized w:0 v:1 player:2 -[2023-09-12 18:24:24,964][09821] Initialized w:0 v:1 player:3 -[2023-09-12 18:24:24,964][09821] Initialized w:0 v:1 player:0 -[2023-09-12 18:24:24,966][09821] 8 agent workers initialized for env 0! -[2023-09-12 18:24:24,978][09822] Initialized w:1 v:1 player:4 -[2023-09-12 18:24:24,980][09822] Initialized w:1 v:1 player:0 -[2023-09-12 18:24:24,982][09822] Initialized w:1 v:1 player:5 -[2023-09-12 18:24:24,982][09822] Initialized w:1 v:1 player:1 -[2023-09-12 18:24:24,984][09822] Initialized w:1 v:1 player:2 -[2023-09-12 18:24:24,984][09822] Initialized w:1 v:1 player:6 -[2023-09-12 18:24:24,985][09822] Initialized w:1 v:1 player:7 -[2023-09-12 18:24:24,985][09822] Initialized w:1 v:1 player:3 -[2023-09-12 18:24:24,987][09822] 8 agent workers initialized for env 1! -[2023-09-12 18:24:24,990][09915] Initializing env for player 0, init_info: {'port': 40901}... -[2023-09-12 18:24:24,996][09823] Decorrelating experience for 32 frames... -[2023-09-12 18:24:25,013][09821] Decorrelating experience for 32 frames... -[2023-09-12 18:24:25,029][09915] Using port 40901 on host... -[2023-09-12 18:24:25,051][09915] Initializing env for player 1, init_info: {'port': 40901}... -[2023-09-12 18:24:25,057][09822] Decorrelating experience for 32 frames... -[2023-09-12 18:24:25,111][09915] Initializing env for player 2, init_info: {'port': 40901}... -[2023-09-12 18:24:25,167][09915] Initializing env for player 3, init_info: {'port': 40901}... -[2023-09-12 18:24:25,231][09915] Initializing env for player 4, init_info: {'port': 40901}... -[2023-09-12 18:24:25,279][09915] Initializing env for player 5, init_info: {'port': 40901}... -[2023-09-12 18:24:25,313][09821] Multi agent env, num agents: 8 -[2023-09-12 18:24:25,335][09915] Initializing env for player 6, init_info: {'port': 40901}... -[2023-09-12 18:24:25,344][09821] Multi agent env, num agents: 8 -[2023-09-12 18:24:25,383][09915] Initializing env for player 7, init_info: {'port': 40901}... -[2023-09-12 18:24:25,383][09821] Port 40302 is available -[2023-09-12 18:24:25,383][09821] Using port 40302 -[2023-09-12 18:24:25,394][09821] Initializing env for player 0, init_info: {'port': 40302}... -[2023-09-12 18:24:25,399][09860] Initialized w:3 v:1 player:0 -[2023-09-12 18:24:25,400][09914] Initialized w:7 v:1 player:1 -[2023-09-12 18:24:25,402][09914] Initialized w:7 v:1 player:6 -[2023-09-12 18:24:25,402][09860] Initialized w:3 v:1 player:2 -[2023-09-12 18:24:25,403][09914] Initialized w:7 v:1 player:7 -[2023-09-12 18:24:25,403][09860] Initialized w:3 v:1 player:6 -[2023-09-12 18:24:25,403][09860] Initialized w:3 v:1 player:4 -[2023-09-12 18:24:25,403][09860] Initialized w:3 v:1 player:7 -[2023-09-12 18:24:25,404][09914] Initialized w:7 v:1 player:0 -[2023-09-12 18:24:25,404][09914] Initialized w:7 v:1 player:2 -[2023-09-12 18:24:25,404][09860] Initialized w:3 v:1 player:1 -[2023-09-12 18:24:25,404][09914] Initialized w:7 v:1 player:4 -[2023-09-12 18:24:25,405][09914] Initialized w:7 v:1 player:3 -[2023-09-12 18:24:25,404][09860] Initialized w:3 v:1 player:5 -[2023-09-12 18:24:25,404][09860] Initialized w:3 v:1 player:3 -[2023-09-12 18:24:25,406][09860] 8 agent workers initialized for env 3! -[2023-09-12 18:24:25,434][09821] Initializing env for player 1, init_info: {'port': 40302}... -[2023-09-12 18:24:25,437][09822] Multi agent env, num agents: 8 -[2023-09-12 18:24:25,439][09821] Using port 40302 on host... -[2023-09-12 18:24:25,441][09860] Decorrelating experience for 32 frames... -[2023-09-12 18:24:25,484][09822] Multi agent env, num agents: 8 -[2023-09-12 18:24:25,486][09821] Initializing env for player 2, init_info: {'port': 40302}... -[2023-09-12 18:24:25,503][09823] Multi agent env, num agents: 8 -[2023-09-12 18:24:25,531][09822] Port 40402 is available -[2023-09-12 18:24:25,531][09822] Using port 40402 -[2023-09-12 18:24:25,531][09822] Initializing env for player 0, init_info: {'port': 40402}... -[2023-09-12 18:24:25,546][09821] Initializing env for player 3, init_info: {'port': 40302}... -[2023-09-12 18:24:25,550][09823] Multi agent env, num agents: 8 -[2023-09-12 18:24:25,566][09822] Using port 40402 on host... -[2023-09-12 18:24:25,583][09822] Initializing env for player 1, init_info: {'port': 40402}... -[2023-09-12 18:24:25,596][09823] Port 40502 is available -[2023-09-12 18:24:25,596][09821] Initializing env for player 4, init_info: {'port': 40302}... -[2023-09-12 18:24:25,597][09823] Using port 40502 -[2023-09-12 18:24:25,597][09823] Initializing env for player 0, init_info: {'port': 40502}... -[2023-09-12 18:24:25,642][09823] Using port 40502 on host... -[2023-09-12 18:24:25,642][09822] Initializing env for player 2, init_info: {'port': 40402}... -[2023-09-12 18:24:25,647][09821] Initializing env for player 5, init_info: {'port': 40302}... -[2023-09-12 18:24:25,653][09823] Initializing env for player 1, init_info: {'port': 40502}... -[2023-09-12 18:24:25,701][09821] Initializing env for player 6, init_info: {'port': 40302}... -[2023-09-12 18:24:25,701][09822] Initializing env for player 3, init_info: {'port': 40402}... -[2023-09-12 18:24:25,710][09823] Initializing env for player 2, init_info: {'port': 40502}... -[2023-09-12 18:24:25,759][09821] Initializing env for player 7, init_info: {'port': 40302}... -[2023-09-12 18:24:25,758][09822] Initializing env for player 4, init_info: {'port': 40402}... -[2023-09-12 18:24:25,776][09823] Initializing env for player 3, init_info: {'port': 40502}... -[2023-09-12 18:24:25,794][09860] Multi agent env, num agents: 8 -[2023-09-12 18:24:25,807][09822] Initializing env for player 5, init_info: {'port': 40402}... -[2023-09-12 18:24:25,823][09823] Initializing env for player 4, init_info: {'port': 40502}... -[2023-09-12 18:24:25,829][09860] Multi agent env, num agents: 8 -[2023-09-12 18:24:25,859][09822] Initializing env for player 6, init_info: {'port': 40402}... -[2023-09-12 18:24:25,861][09860] Port 40602 is available -[2023-09-12 18:24:25,861][09860] Using port 40602 -[2023-09-12 18:24:25,875][09823] Initializing env for player 5, init_info: {'port': 40502}... -[2023-09-12 18:24:25,914][09822] Initializing env for player 7, init_info: {'port': 40402}... -[2023-09-12 18:24:25,925][09823] Initializing env for player 6, init_info: {'port': 40502}... -[2023-09-12 18:24:26,003][09823] Initializing env for player 7, init_info: {'port': 40502}... -[2023-09-12 18:24:26,045][09855] Initialized w:4 v:1 player:2 -[2023-09-12 18:24:26,046][09855] Initialized w:4 v:1 player:0 -[2023-09-12 18:24:26,047][09855] Initialized w:4 v:1 player:1 -[2023-09-12 18:24:26,047][09855] Initialized w:4 v:1 player:6 -[2023-09-12 18:24:26,047][09855] Initialized w:4 v:1 player:5 -[2023-09-12 18:24:26,048][09855] Initialized w:4 v:1 player:7 -[2023-09-12 18:24:26,050][09855] Initialized w:4 v:1 player:4 -[2023-09-12 18:24:26,050][09855] Initialized w:4 v:1 player:3 -[2023-09-12 18:24:26,052][09855] 8 agent workers initialized for env 4! -[2023-09-12 18:24:26,100][09855] Decorrelating experience for 32 frames... -[2023-09-12 18:24:26,202][09916] Initialized w:5 v:1 player:6 -[2023-09-12 18:24:26,203][09916] Initialized w:5 v:1 player:5 -[2023-09-12 18:24:26,205][09916] Initialized w:5 v:1 player:3 -[2023-09-12 18:24:26,205][09916] Initialized w:5 v:1 player:0 -[2023-09-12 18:24:26,206][09916] Initialized w:5 v:1 player:1 -[2023-09-12 18:24:26,207][09916] Initialized w:5 v:1 player:7 -[2023-09-12 18:24:26,207][09916] Initialized w:5 v:1 player:4 -[2023-09-12 18:24:26,207][09916] Initialized w:5 v:1 player:2 -[2023-09-12 18:24:26,208][09916] 8 agent workers initialized for env 5! -[2023-09-12 18:24:26,246][09916] Decorrelating experience for 32 frames... -[2023-09-12 18:24:26,430][09855] Multi agent env, num agents: 8 -[2023-09-12 18:24:26,461][09855] Multi agent env, num agents: 8 -[2023-09-12 18:24:26,494][09855] Port 40702 is available -[2023-09-12 18:24:26,494][09855] Using port 40702 -[2023-09-12 18:24:26,495][09855] Initializing env for player 0, init_info: {'port': 40702}... -[2023-09-12 18:24:26,521][09916] Multi agent env, num agents: 8 -[2023-09-12 18:24:26,526][09855] Using port 40702 on host... -[2023-09-12 18:24:26,546][09855] Initializing env for player 1, init_info: {'port': 40702}... -[2023-09-12 18:24:26,551][09916] Multi agent env, num agents: 8 -[2023-09-12 18:24:26,580][09916] Port 40802 is available -[2023-09-12 18:24:26,581][09916] Using port 40802 -[2023-09-12 18:24:26,596][09855] Initializing env for player 2, init_info: {'port': 40702}... -[2023-09-12 18:24:26,647][09855] Initializing env for player 3, init_info: {'port': 40702}... -[2023-09-12 18:24:26,703][09855] Initializing env for player 4, init_info: {'port': 40702}... -[2023-09-12 18:24:26,755][09855] Initializing env for player 5, init_info: {'port': 40702}... -[2023-09-12 18:24:26,779][09915] Initialized w:6 v:1 player:0 -[2023-09-12 18:24:26,780][09915] Initialized w:6 v:1 player:5 -[2023-09-12 18:24:26,780][09915] Initialized w:6 v:1 player:7 -[2023-09-12 18:24:26,782][09915] Initialized w:6 v:1 player:3 -[2023-09-12 18:24:26,782][09915] Initialized w:6 v:1 player:2 -[2023-09-12 18:24:26,782][09915] Initialized w:6 v:1 player:4 -[2023-09-12 18:24:26,782][09915] Initialized w:6 v:1 player:1 -[2023-09-12 18:24:26,782][09915] Initialized w:6 v:1 player:6 -[2023-09-12 18:24:26,784][09915] 8 agent workers initialized for env 6! -[2023-09-12 18:24:26,803][09855] Initializing env for player 6, init_info: {'port': 40702}... -[2023-09-12 18:24:26,816][09915] Decorrelating experience for 32 frames... -[2023-09-12 18:24:26,856][09855] Initializing env for player 7, init_info: {'port': 40702}... -[2023-09-12 18:24:27,086][09821] Initialized w:0 v:2 player:4 -[2023-09-12 18:24:27,089][09821] Initialized w:0 v:2 player:5 -[2023-09-12 18:24:27,089][09821] Initialized w:0 v:2 player:0 -[2023-09-12 18:24:27,091][09821] Initialized w:0 v:2 player:6 -[2023-09-12 18:24:27,096][09821] Initialized w:0 v:2 player:2 -[2023-09-12 18:24:27,096][09821] Initialized w:0 v:2 player:1 -[2023-09-12 18:24:27,102][09915] Multi agent env, num agents: 8 -[2023-09-12 18:24:27,141][09915] Multi agent env, num agents: 8 -[2023-09-12 18:24:27,180][09915] Port 40902 is available -[2023-09-12 18:24:27,180][09915] Using port 40902 -[2023-09-12 18:24:27,180][09915] Initializing env for player 0, init_info: {'port': 40902}... -[2023-09-12 18:24:27,193][09822] Initialized w:1 v:2 player:2 -[2023-09-12 18:24:27,195][09822] Initialized w:1 v:2 player:6 -[2023-09-12 18:24:27,195][09822] Initialized w:1 v:2 player:4 -[2023-09-12 18:24:27,195][09822] Initialized w:1 v:2 player:7 -[2023-09-12 18:24:27,195][09822] Initialized w:1 v:2 player:3 -[2023-09-12 18:24:27,196][09822] Initialized w:1 v:2 player:0 -[2023-09-12 18:24:27,196][09822] Initialized w:1 v:2 player:1 -[2023-09-12 18:24:27,196][09822] Initialized w:1 v:2 player:5 -[2023-09-12 18:24:27,201][09822] 8 agent workers initialized for env 1! -[2023-09-12 18:24:27,213][09915] Using port 40902 on host... -[2023-09-12 18:24:27,224][09860] Initializing env for player 0, init_info: {'port': 40602}... -[2023-09-12 18:24:27,231][09915] Initializing env for player 1, init_info: {'port': 40902}... -[2023-09-12 18:24:27,255][09822] Decorrelating experience for 64 frames... -[2023-09-12 18:24:27,258][09860] Using port 40602 on host... -[2023-09-12 18:24:27,272][09823] Initialized w:2 v:2 player:1 -[2023-09-12 18:24:27,274][09823] Initialized w:2 v:2 player:5 -[2023-09-12 18:24:27,275][09860] Initializing env for player 1, init_info: {'port': 40602}... -[2023-09-12 18:24:27,276][09823] Initialized w:2 v:2 player:7 -[2023-09-12 18:24:27,276][09823] Initialized w:2 v:2 player:2 -[2023-09-12 18:24:27,277][09823] Initialized w:2 v:2 player:4 -[2023-09-12 18:24:27,277][09823] Initialized w:2 v:2 player:6 -[2023-09-12 18:24:27,277][09823] Initialized w:2 v:2 player:0 -[2023-09-12 18:24:27,281][09915] Initializing env for player 2, init_info: {'port': 40902}... -[2023-09-12 18:24:27,325][09860] Initializing env for player 2, init_info: {'port': 40602}... -[2023-09-12 18:24:27,335][09915] Initializing env for player 3, init_info: {'port': 40902}... -[2023-09-12 18:24:27,383][09860] Initializing env for player 3, init_info: {'port': 40602}... -[2023-09-12 18:24:27,385][09915] Initializing env for player 4, init_info: {'port': 40902}... -[2023-09-12 18:24:27,443][09860] Initializing env for player 4, init_info: {'port': 40602}... -[2023-09-12 18:24:27,447][09915] Initializing env for player 5, init_info: {'port': 40902}... -[2023-09-12 18:24:27,495][09860] Initializing env for player 5, init_info: {'port': 40602}... -[2023-09-12 18:24:27,499][09915] Initializing env for player 6, init_info: {'port': 40902}... -[2023-09-12 18:24:27,555][09860] Initializing env for player 6, init_info: {'port': 40602}... -[2023-09-12 18:24:27,571][09915] Initializing env for player 7, init_info: {'port': 40902}... -[2023-09-12 18:24:27,595][09860] Initializing env for player 7, init_info: {'port': 40602}... -[2023-09-12 18:24:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:24:28,052][09822] Port 40403 is available -[2023-09-12 18:24:28,052][09822] Using port 40403 -[2023-09-12 18:24:28,053][09822] Initializing env for player 0, init_info: {'port': 40403}... -[2023-09-12 18:24:28,086][09821] Initialized w:0 v:2 player:7 -[2023-09-12 18:24:28,096][09822] Using port 40403 on host... -[2023-09-12 18:24:28,107][09855] Initialized w:4 v:2 player:3 -[2023-09-12 18:24:28,108][09855] Initialized w:4 v:2 player:5 -[2023-09-12 18:24:28,108][09855] Initialized w:4 v:2 player:4 -[2023-09-12 18:24:28,109][09822] Initializing env for player 1, init_info: {'port': 40403}... -[2023-09-12 18:24:28,110][09855] Initialized w:4 v:2 player:1 -[2023-09-12 18:24:28,110][09855] Initialized w:4 v:2 player:2 -[2023-09-12 18:24:28,110][09855] Initialized w:4 v:2 player:0 -[2023-09-12 18:24:28,111][09855] Initialized w:4 v:2 player:7 -[2023-09-12 18:24:28,111][09855] Initialized w:4 v:2 player:6 -[2023-09-12 18:24:28,112][09855] 8 agent workers initialized for env 4! -[2023-09-12 18:24:28,168][09822] Initializing env for player 2, init_info: {'port': 40403}... -[2023-09-12 18:24:28,173][09855] Decorrelating experience for 64 frames... -[2023-09-12 18:24:28,218][09822] Initializing env for player 3, init_info: {'port': 40403}... -[2023-09-12 18:24:28,271][09823] Initialized w:2 v:2 player:3 -[2023-09-12 18:24:28,272][09823] 8 agent workers initialized for env 2! -[2023-09-12 18:24:28,275][09822] Initializing env for player 4, init_info: {'port': 40403}... -[2023-09-12 18:24:28,342][09823] Decorrelating experience for 64 frames... -[2023-09-12 18:24:28,352][09822] Initializing env for player 5, init_info: {'port': 40403}... -[2023-09-12 18:24:28,413][09822] Initializing env for player 6, init_info: {'port': 40403}... -[2023-09-12 18:24:28,467][09822] Initializing env for player 7, init_info: {'port': 40403}... -[2023-09-12 18:24:28,841][09915] Initialized w:6 v:2 player:2 -[2023-09-12 18:24:28,843][09915] Initialized w:6 v:2 player:6 -[2023-09-12 18:24:28,844][09915] Initialized w:6 v:2 player:1 -[2023-09-12 18:24:28,844][09915] Initialized w:6 v:2 player:3 -[2023-09-12 18:24:28,844][09915] Initialized w:6 v:2 player:4 -[2023-09-12 18:24:28,846][09915] Initialized w:6 v:2 player:5 -[2023-09-12 18:24:28,847][09915] Initialized w:6 v:2 player:7 -[2023-09-12 18:24:28,848][09915] Initialized w:6 v:2 player:0 -[2023-09-12 18:24:28,849][09915] 8 agent workers initialized for env 6! -[2023-09-12 18:24:28,869][09855] Port 40703 is available -[2023-09-12 18:24:28,870][09855] Using port 40703 -[2023-09-12 18:24:28,870][09855] Initializing env for player 0, init_info: {'port': 40703}... -[2023-09-12 18:24:28,895][09860] Initialized w:3 v:2 player:1 -[2023-09-12 18:24:28,897][09860] Initialized w:3 v:2 player:3 -[2023-09-12 18:24:28,897][09860] Initialized w:3 v:2 player:5 -[2023-09-12 18:24:28,897][09860] Initialized w:3 v:2 player:2 -[2023-09-12 18:24:28,901][09855] Using port 40703 on host... -[2023-09-12 18:24:28,898][09860] Initialized w:3 v:2 player:7 -[2023-09-12 18:24:28,898][09860] Initialized w:3 v:2 player:6 -[2023-09-12 18:24:28,898][09860] Initialized w:3 v:2 player:4 -[2023-09-12 18:24:28,901][09860] Initialized w:3 v:2 player:0 -[2023-09-12 18:24:28,903][09860] 8 agent workers initialized for env 3! -[2023-09-12 18:24:28,913][09915] Decorrelating experience for 64 frames... -[2023-09-12 18:24:28,921][09855] Initializing env for player 1, init_info: {'port': 40703}... -[2023-09-12 18:24:28,937][09860] Decorrelating experience for 64 frames... -[2023-09-12 18:24:28,980][09855] Initializing env for player 2, init_info: {'port': 40703}... -[2023-09-12 18:24:28,999][09823] Port 40503 is available -[2023-09-12 18:24:28,999][09823] Using port 40503 -[2023-09-12 18:24:29,000][09823] Initializing env for player 0, init_info: {'port': 40503}... -[2023-09-12 18:24:29,030][09855] Initializing env for player 3, init_info: {'port': 40703}... -[2023-09-12 18:24:29,036][09823] Using port 40503 on host... -[2023-09-12 18:24:29,051][09823] Initializing env for player 1, init_info: {'port': 40503}... -[2023-09-12 18:24:29,085][09855] Initializing env for player 4, init_info: {'port': 40703}... -[2023-09-12 18:24:29,102][09823] Initializing env for player 2, init_info: {'port': 40503}... -[2023-09-12 18:24:29,135][09855] Initializing env for player 5, init_info: {'port': 40703}... -[2023-09-12 18:24:29,155][09823] Initializing env for player 3, init_info: {'port': 40503}... -[2023-09-12 18:24:29,199][09855] Initializing env for player 6, init_info: {'port': 40703}... -[2023-09-12 18:24:29,211][09823] Initializing env for player 4, init_info: {'port': 40503}... -[2023-09-12 18:24:29,239][09855] Initializing env for player 7, init_info: {'port': 40703}... -[2023-09-12 18:24:29,263][09823] Initializing env for player 5, init_info: {'port': 40503}... -[2023-09-12 18:24:29,319][09823] Initializing env for player 6, init_info: {'port': 40503}... -[2023-09-12 18:24:29,367][09823] Initializing env for player 7, init_info: {'port': 40503}... -[2023-09-12 18:24:29,660][09915] Port 40903 is available -[2023-09-12 18:24:29,660][09915] Using port 40903 -[2023-09-12 18:24:29,726][09860] Port 40603 is available -[2023-09-12 18:24:29,726][09860] Using port 40603 -[2023-09-12 18:24:29,726][09860] Initializing env for player 0, init_info: {'port': 40603}... -[2023-09-12 18:24:29,755][09860] Using port 40603 on host... -[2023-09-12 18:24:29,777][09860] Initializing env for player 1, init_info: {'port': 40603}... -[2023-09-12 18:24:29,801][09822] Initialized w:1 v:3 player:7 -[2023-09-12 18:24:29,802][09822] Initialized w:1 v:3 player:5 -[2023-09-12 18:24:29,802][09822] Initialized w:1 v:3 player:4 -[2023-09-12 18:24:29,802][09822] Initialized w:1 v:3 player:6 -[2023-09-12 18:24:29,802][09822] Initialized w:1 v:3 player:0 -[2023-09-12 18:24:29,803][09822] Initialized w:1 v:3 player:3 -[2023-09-12 18:24:29,803][09822] Initialized w:1 v:3 player:2 -[2023-09-12 18:24:29,803][09822] Initialized w:1 v:3 player:1 -[2023-09-12 18:24:29,805][09822] 8 agent workers initialized for env 1! -[2023-09-12 18:24:29,812][09915] Initializing env for player 0, init_info: {'port': 40903}... -[2023-09-12 18:24:29,839][09860] Initializing env for player 2, init_info: {'port': 40603}... -[2023-09-12 18:24:29,844][09915] Using port 40903 on host... -[2023-09-12 18:24:29,848][09822] Decorrelating experience for 96 frames... -[2023-09-12 18:24:29,863][09915] Initializing env for player 1, init_info: {'port': 40903}... -[2023-09-12 18:24:29,900][09860] Initializing env for player 3, init_info: {'port': 40603}... -[2023-09-12 18:24:29,913][09915] Initializing env for player 2, init_info: {'port': 40903}... -[2023-09-12 18:24:29,950][09860] Initializing env for player 4, init_info: {'port': 40603}... -[2023-09-12 18:24:29,967][09915] Initializing env for player 3, init_info: {'port': 40903}... -[2023-09-12 18:24:30,007][09860] Initializing env for player 5, init_info: {'port': 40603}... -[2023-09-12 18:24:30,019][09915] Initializing env for player 4, init_info: {'port': 40903}... -[2023-09-12 18:24:30,071][09915] Initializing env for player 5, init_info: {'port': 40903}... -[2023-09-12 18:24:30,076][09860] Initializing env for player 6, init_info: {'port': 40603}... -[2023-09-12 18:24:30,123][09860] Initializing env for player 7, init_info: {'port': 40603}... -[2023-09-12 18:24:30,151][09915] Initializing env for player 6, init_info: {'port': 40903}... -[2023-09-12 18:24:30,175][09915] Initializing env for player 7, init_info: {'port': 40903}... -[2023-09-12 18:24:30,602][09823] Initialized w:2 v:3 player:0 -[2023-09-12 18:24:30,606][09823] Initialized w:2 v:3 player:1 -[2023-09-12 18:24:30,607][09823] Initialized w:2 v:3 player:2 -[2023-09-12 18:24:30,607][09823] Initialized w:2 v:3 player:3 -[2023-09-12 18:24:30,607][09823] Initialized w:2 v:3 player:7 -[2023-09-12 18:24:30,607][09823] Initialized w:2 v:3 player:5 -[2023-09-12 18:24:30,607][09823] Initialized w:2 v:3 player:4 -[2023-09-12 18:24:30,607][09823] Initialized w:2 v:3 player:6 -[2023-09-12 18:24:30,609][09823] 8 agent workers initialized for env 2! -[2023-09-12 18:24:30,635][09855] Initialized w:4 v:3 player:3 -[2023-09-12 18:24:30,636][09855] Initialized w:4 v:3 player:0 -[2023-09-12 18:24:30,637][09855] Initialized w:4 v:3 player:2 -[2023-09-12 18:24:30,637][09855] Initialized w:4 v:3 player:1 -[2023-09-12 18:24:30,637][09855] Initialized w:4 v:3 player:6 -[2023-09-12 18:24:30,637][09855] Initialized w:4 v:3 player:4 -[2023-09-12 18:24:30,638][09855] Initialized w:4 v:3 player:7 -[2023-09-12 18:24:30,638][09855] Initialized w:4 v:3 player:5 -[2023-09-12 18:24:30,640][09855] 8 agent workers initialized for env 4! -[2023-09-12 18:24:30,655][09823] Decorrelating experience for 96 frames... -[2023-09-12 18:24:30,683][09855] Decorrelating experience for 96 frames... -[2023-09-12 18:24:31,332][09915] Initialized w:6 v:3 player:4 -[2023-09-12 18:24:31,333][09915] Initialized w:6 v:3 player:5 -[2023-09-12 18:24:31,334][09915] Initialized w:6 v:3 player:2 -[2023-09-12 18:24:31,334][09915] Initialized w:6 v:3 player:0 -[2023-09-12 18:24:31,334][09915] Initialized w:6 v:3 player:1 -[2023-09-12 18:24:31,334][09915] Initialized w:6 v:3 player:7 -[2023-09-12 18:24:31,334][09915] Initialized w:6 v:3 player:6 -[2023-09-12 18:24:31,334][09915] Initialized w:6 v:3 player:3 -[2023-09-12 18:24:31,338][09915] 8 agent workers initialized for env 6! -[2023-09-12 18:24:31,392][09915] Decorrelating experience for 96 frames... -[2023-09-12 18:24:31,427][09860] Initialized w:3 v:3 player:0 -[2023-09-12 18:24:31,429][09860] Initialized w:3 v:3 player:3 -[2023-09-12 18:24:31,429][09860] Initialized w:3 v:3 player:4 -[2023-09-12 18:24:31,429][09860] Initialized w:3 v:3 player:6 -[2023-09-12 18:24:31,430][09860] Initialized w:3 v:3 player:5 -[2023-09-12 18:24:31,431][09860] Initialized w:3 v:3 player:2 -[2023-09-12 18:24:31,431][09860] Initialized w:3 v:3 player:7 -[2023-09-12 18:24:32,425][09860] Initialized w:3 v:3 player:1 -[2023-09-12 18:24:32,426][09860] 8 agent workers initialized for env 3! -[2023-09-12 18:24:32,490][09860] Decorrelating experience for 96 frames... -[2023-09-12 18:24:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:24:33,098][09685] Signal inference workers to stop experience collection... -[2023-09-12 18:24:33,118][09820] InferenceWorker_p0-w0: stopping experience collection -[2023-09-12 18:24:34,302][09685] EvtLoop [learner_proc0_evt_loop, process=learner_proc0] unhandled exception in slot='on_new_training_batch' connected to emitter=Emitter(object_id='Batcher_0', signal_name='training_batches_available'), args=(0,) -Traceback (most recent call last): - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py", line 355, in _process_signal - slot_callable(*args) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner_worker.py", line 150, in on_new_training_batch - stats = self.learner.train(self.batcher.training_batches[batch_idx]) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 1046, in train - train_stats = self._train(buff, self.cfg.batch_size, experience_size, num_invalids) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 731, in _train - ) = self._calculate_losses(mb, num_invalids) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 649, in _calculate_losses - exploration_loss = self.exploration_loss_func(action_distribution, valids, num_invalids) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 477, in _symmetric_kl_exploration_loss - kl_prior = action_distribution.symmetric_kl_with_uniform_prior() - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py", line 247, in symmetric_kl_with_uniform_prior - sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions] - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py", line 247, in - sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions] -AttributeError: 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior' -[2023-09-12 18:24:34,303][09685] Unhandled exception 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior' in evt loop learner_proc0_evt_loop -[2023-09-12 18:24:36,010][129210] Heartbeat connected on Batcher_0 -[2023-09-12 18:24:36,016][129210] Heartbeat connected on InferenceWorker_p0-w0 -[2023-09-12 18:24:36,025][129210] Heartbeat connected on RolloutWorker_w1 -[2023-09-12 18:24:36,029][129210] Heartbeat connected on RolloutWorker_w2 -[2023-09-12 18:24:36,034][129210] Heartbeat connected on RolloutWorker_w3 -[2023-09-12 18:24:36,038][129210] Heartbeat connected on RolloutWorker_w4 -[2023-09-12 18:24:36,046][129210] Heartbeat connected on RolloutWorker_w6 -[2023-09-12 18:24:36,593][09916] Port 40802 is available -[2023-09-12 18:24:36,594][09916] Using port 40802 -[2023-09-12 18:24:36,594][09916] Initializing env for player 0, init_info: {'port': 40802}... -[2023-09-12 18:24:36,628][09916] Using port 40802 on host... -[2023-09-12 18:24:36,645][09916] Initializing env for player 1, init_info: {'port': 40802}... -[2023-09-12 18:24:36,695][09916] Initializing env for player 2, init_info: {'port': 40802}... -[2023-09-12 18:24:36,746][09916] Initializing env for player 3, init_info: {'port': 40802}... -[2023-09-12 18:24:36,803][09916] Initializing env for player 4, init_info: {'port': 40802}... -[2023-09-12 18:24:36,859][09916] Initializing env for player 5, init_info: {'port': 40802}... -[2023-09-12 18:24:36,915][09916] Initializing env for player 6, init_info: {'port': 40802}... -[2023-09-12 18:24:36,971][09916] Initializing env for player 7, init_info: {'port': 40802}... -[2023-09-12 18:24:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 206.6. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:24:38,190][09916] Initialized w:5 v:2 player:3 -[2023-09-12 18:24:38,193][09916] Initialized w:5 v:2 player:4 -[2023-09-12 18:24:38,193][09916] Initialized w:5 v:2 player:0 -[2023-09-12 18:24:38,193][09916] Initialized w:5 v:2 player:7 -[2023-09-12 18:24:38,193][09916] Initialized w:5 v:2 player:1 -[2023-09-12 18:24:38,194][09916] Initialized w:5 v:2 player:2 -[2023-09-12 18:24:38,194][09916] Initialized w:5 v:2 player:6 -[2023-09-12 18:24:38,194][09916] Initialized w:5 v:2 player:5 -[2023-09-12 18:24:38,196][09916] 8 agent workers initialized for env 5! -[2023-09-12 18:24:38,246][09916] Decorrelating experience for 64 frames... -[2023-09-12 18:24:38,744][09916] Port 40803 is available -[2023-09-12 18:24:38,744][09916] Using port 40803 -[2023-09-12 18:24:38,745][09916] Initializing env for player 0, init_info: {'port': 40803}... -[2023-09-12 18:24:38,773][09916] Using port 40803 on host... -[2023-09-12 18:24:38,796][09916] Initializing env for player 1, init_info: {'port': 40803}... -[2023-09-12 18:24:38,846][09916] Initializing env for player 2, init_info: {'port': 40803}... -[2023-09-12 18:24:38,897][09916] Initializing env for player 3, init_info: {'port': 40803}... -[2023-09-12 18:24:38,955][09916] Initializing env for player 4, init_info: {'port': 40803}... -[2023-09-12 18:24:39,011][09916] Initializing env for player 5, init_info: {'port': 40803}... -[2023-09-12 18:24:39,063][09916] Initializing env for player 6, init_info: {'port': 40803}... -[2023-09-12 18:24:39,131][09916] Initializing env for player 7, init_info: {'port': 40803}... -[2023-09-12 18:24:40,340][09916] Initialized w:5 v:3 player:1 -[2023-09-12 18:24:40,340][09916] Initialized w:5 v:3 player:4 -[2023-09-12 18:24:40,340][09916] Initialized w:5 v:3 player:0 -[2023-09-12 18:24:40,340][09916] Initialized w:5 v:3 player:6 -[2023-09-12 18:24:40,340][09916] Initialized w:5 v:3 player:3 -[2023-09-12 18:24:40,340][09916] Initialized w:5 v:3 player:7 -[2023-09-12 18:24:40,340][09916] Initialized w:5 v:3 player:2 -[2023-09-12 18:24:40,341][09916] Initialized w:5 v:3 player:5 -[2023-09-12 18:24:40,344][09916] 8 agent workers initialized for env 5! -[2023-09-12 18:24:40,387][09916] Decorrelating experience for 96 frames... -[2023-09-12 18:24:41,160][129210] Heartbeat connected on RolloutWorker_w5 -[2023-09-12 18:24:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 160.9. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:24:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 131.7. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:24:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 111.5. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:24:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 96.7. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:25:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 85.3. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:25:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 80.7. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:25:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 80.7. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:25:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 80.7. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:25:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:25:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:25:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:25:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:25:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:25:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:25:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:25:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:26:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:26:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:26:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:26:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:26:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:26:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:26:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:26:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:26:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:26:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:26:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:26:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:27:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:27:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:27:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:27:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:27:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:27:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:27:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:27:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:27:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:27:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:27:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:27:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:28:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:28:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:28:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:28:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:28:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:28:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:28:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:28:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:28:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:28:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:28:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:28:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:29:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:29:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:29:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:29:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:29:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:29:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:29:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:29:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:29:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:29:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:29:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:29:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:30:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:30:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:30:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:30:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:30:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:30:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:30:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:30:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:30:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:30:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:30:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:30:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:31:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:31:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:31:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:31:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:31:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:31:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:31:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:31:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:31:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:31:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:31:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:31:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:32:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:32:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:32:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:32:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:32:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:32:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:32:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:32:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:32:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:32:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:32:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:32:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:33:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:33:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:33:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:33:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:33:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:33:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:33:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:33:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:33:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:33:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:33:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:33:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:34:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:34:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:34:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:34:12,722][129210] Components not started: LearnerWorker_p0, RolloutWorker_w0, RolloutWorker_w7, wait_time=600.0 seconds -[2023-09-12 18:34:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:34:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:34:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:34:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:34:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:34:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:34:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:34:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:34:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:35:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:35:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:35:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:35:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:35:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:35:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:35:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:35:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:35:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:35:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:35:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:35:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:36:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:36:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:36:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:36:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:36:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:36:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:36:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:36:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:36:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:36:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:36:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:36:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:37:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:37:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:37:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:37:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:37:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:37:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:37:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:37:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:37:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:37:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:37:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:37:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:38:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:38:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:38:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:38:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:38:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:38:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:38:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:38:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:38:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:38:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:38:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:38:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:39:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:39:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:39:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:39:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:39:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:39:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:39:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:39:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:39:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:39:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:39:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:39:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:40:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:40:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:40:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:40:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:40:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:40:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:40:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:40:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:40:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:40:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:40:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:40:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:41:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:41:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:41:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:41:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:41:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:41:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:41:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:41:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:41:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:41:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:41:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:41:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:42:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:42:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:42:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:42:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:42:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:42:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:42:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:42:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:42:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:42:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:42:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:42:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:43:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:43:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:43:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:43:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:43:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:43:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:43:32,718][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:43:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:43:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:43:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:43:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:43:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:44:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:44:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:44:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:44:12,721][129210] Components not started: LearnerWorker_p0, RolloutWorker_w0, RolloutWorker_w7, wait_time=1200.0 seconds -[2023-09-12 18:44:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:44:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:44:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:44:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:44:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:44:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:44:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:44:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:44:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:45:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:45:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:45:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:45:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:45:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:45:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:45:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:45:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:45:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:45:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:45:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:45:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:46:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:46:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:46:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:46:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:46:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:46:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:46:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:46:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:46:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:46:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:46:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:46:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:47:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:47:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:47:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:47:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:47:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:47:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:47:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:47:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:47:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:47:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:47:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:47:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:48:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:48:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:48:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:48:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:48:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:48:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:48:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:48:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:48:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:48:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:48:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:48:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:49:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:49:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:49:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:49:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:49:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:49:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:49:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:49:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:49:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:49:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:49:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:49:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:50:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:50:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:50:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:50:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:50:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:50:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:50:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:50:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:50:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:50:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:50:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:50:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:51:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:51:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:51:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:51:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:51:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:51:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:51:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:51:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:51:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:51:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:51:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:51:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:52:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:52:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:52:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:52:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:52:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:52:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:52:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:52:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:52:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:52:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:52:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:52:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:53:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:53:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:53:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:53:17,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:53:22,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:53:27,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:53:32,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:53:37,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:53:42,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:53:47,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:53:52,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:53:57,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:54:02,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:54:07,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:54:12,716][129210] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 3632. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 18:54:12,719][129210] Components not started: LearnerWorker_p0, RolloutWorker_w0, RolloutWorker_w7, wait_time=1800.0 seconds -[2023-09-12 18:54:12,722][129210] Components take too long to start: LearnerWorker_p0, RolloutWorker_w0, RolloutWorker_w7. Aborting the experiment! - - - -[2023-09-12 18:54:12,725][09685] Stopping Batcher_0... -[2023-09-12 18:54:12,725][09685] Loop batcher_evt_loop terminating... -[2023-09-12 18:54:12,725][129210] Component Batcher_0 stopped! -[2023-09-12 18:54:12,727][129210] Waiting for ['LearnerWorker_p0', 'InferenceWorker_p0-w0', 'RolloutWorker_w0', 'RolloutWorker_w1', 'RolloutWorker_w2', 'RolloutWorker_w3', 'RolloutWorker_w4', 'RolloutWorker_w5', 'RolloutWorker_w6', 'RolloutWorker_w7'] to stop... -[2023-09-12 18:54:12,743][09820] Weights refcount: 2 0 -[2023-09-12 18:54:12,744][09820] Stopping InferenceWorker_p0-w0... -[2023-09-12 18:54:12,744][09820] Loop inference_proc0-0_evt_loop terminating... -[2023-09-12 18:54:12,744][129210] Component InferenceWorker_p0-w0 stopped! -[2023-09-12 18:54:12,745][129210] Waiting for ['LearnerWorker_p0', 'RolloutWorker_w0', 'RolloutWorker_w1', 'RolloutWorker_w2', 'RolloutWorker_w3', 'RolloutWorker_w4', 'RolloutWorker_w5', 'RolloutWorker_w6', 'RolloutWorker_w7'] to stop... -[2023-09-12 18:54:15,940][09822] Stopping RolloutWorker_w1... -[2023-09-12 18:54:15,941][09822] Loop rollout_proc1_evt_loop terminating... -[2023-09-12 18:54:15,941][09916] Stopping RolloutWorker_w5... -[2023-09-12 18:54:15,941][09823] Stopping RolloutWorker_w2... -[2023-09-12 18:54:15,941][09860] Stopping RolloutWorker_w3... -[2023-09-12 18:54:15,941][09916] Loop rollout_proc5_evt_loop terminating... -[2023-09-12 18:54:15,942][09823] Loop rollout_proc2_evt_loop terminating... -[2023-09-12 18:54:15,940][129210] Component LearnerWorker_p0 process died already! Don't wait for it. -[2023-09-12 18:54:15,942][09860] Loop rollout_proc3_evt_loop terminating... -[2023-09-12 18:54:15,942][09915] Stopping RolloutWorker_w6... -[2023-09-12 18:54:15,943][09855] Stopping RolloutWorker_w4... -[2023-09-12 18:54:15,943][09915] Loop rollout_proc6_evt_loop terminating... -[2023-09-12 18:54:15,943][09855] Loop rollout_proc4_evt_loop terminating... -[2023-09-12 18:54:15,942][129210] Component RolloutWorker_w1 stopped! -[2023-09-12 18:54:15,945][129210] Waiting for ['RolloutWorker_w0', 'RolloutWorker_w2', 'RolloutWorker_w3', 'RolloutWorker_w4', 'RolloutWorker_w5', 'RolloutWorker_w6', 'RolloutWorker_w7'] to stop... -[2023-09-12 18:54:15,946][129210] Component RolloutWorker_w5 stopped! -[2023-09-12 18:54:15,947][129210] Waiting for ['RolloutWorker_w0', 'RolloutWorker_w2', 'RolloutWorker_w3', 'RolloutWorker_w4', 'RolloutWorker_w6', 'RolloutWorker_w7'] to stop... -[2023-09-12 18:54:15,949][129210] Component RolloutWorker_w2 stopped! -[2023-09-12 18:54:15,950][129210] Waiting for ['RolloutWorker_w0', 'RolloutWorker_w3', 'RolloutWorker_w4', 'RolloutWorker_w6', 'RolloutWorker_w7'] to stop... -[2023-09-12 18:54:15,951][129210] Component RolloutWorker_w3 stopped! -[2023-09-12 18:54:15,952][129210] Waiting for ['RolloutWorker_w0', 'RolloutWorker_w4', 'RolloutWorker_w6', 'RolloutWorker_w7'] to stop... -[2023-09-12 18:54:15,953][129210] Component RolloutWorker_w6 stopped! -[2023-09-12 18:54:15,954][129210] Waiting for ['RolloutWorker_w0', 'RolloutWorker_w4', 'RolloutWorker_w7'] to stop... -[2023-09-12 18:54:15,955][129210] Component RolloutWorker_w4 stopped! -[2023-09-12 18:54:15,955][129210] Waiting for ['RolloutWorker_w0', 'RolloutWorker_w7'] to stop... -[2023-09-12 19:25:28,797][129210] Keyboard interrupt detected in the event loop EvtLoop [Runner_EvtLoop, process=main process 129210], exiting... -[2023-09-12 19:25:28,800][09821] VizDoom game.init() threw an exception SignalException('Signal SIGINT received. ViZDoom instance has been closed.'). Terminate process... -[2023-09-12 19:25:28,800][09914] VizDoom game.init() threw an exception SignalException('Signal SIGINT received. ViZDoom instance has been closed.'). Terminate process... -[2023-09-12 19:25:28,800][129210] Runner profile tree view: -main_loop: 3672.7494 -[2023-09-12 19:25:28,802][09821] Failed with error RuntimeError('Critical error: worker stuck on initialization. Abort! '), trying again -[2023-09-12 19:25:28,802][129210] Collected {0: 0}, FPS: 0.0 -[2023-09-12 19:25:28,804][09914] Failed with error RuntimeError('Critical error: worker stuck on initialization. Abort! '), trying again -[2023-09-12 19:25:28,831][129210] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json -[2023-09-12 19:25:28,832][129210] Overriding arg 'num_workers' with value 1 passed from command line -[2023-09-12 19:25:28,833][129210] Adding new argument 'no_render'=True that is not in the saved config file! -[2023-09-12 19:25:28,834][129210] Adding new argument 'save_video'=True that is not in the saved config file! -[2023-09-12 19:25:28,834][129210] Adding new argument 'video_frames'=1000000000.0 that is not in the saved config file! -[2023-09-12 19:25:28,835][129210] Adding new argument 'video_name'=None that is not in the saved config file! -[2023-09-12 19:25:28,836][129210] Adding new argument 'max_num_frames'=100000 that is not in the saved config file! -[2023-09-12 19:25:28,837][129210] Adding new argument 'max_num_episodes'=10 that is not in the saved config file! -[2023-09-12 19:25:28,837][129210] Adding new argument 'push_to_hub'=True that is not in the saved config file! -[2023-09-12 19:25:28,838][129210] Adding new argument 'hf_repository'='MattStammers/vizdoom_fight' that is not in the saved config file! -[2023-09-12 19:25:28,839][129210] Adding new argument 'policy_index'=0 that is not in the saved config file! -[2023-09-12 19:25:28,840][129210] Adding new argument 'eval_deterministic'=False that is not in the saved config file! -[2023-09-12 19:25:28,841][129210] Adding new argument 'train_script'=None that is not in the saved config file! -[2023-09-12 19:25:28,841][129210] Adding new argument 'enjoy_script'=None that is not in the saved config file! -[2023-09-12 19:25:28,842][129210] Using frameskip 1 and render_action_repeat=4 for evaluation -[2023-09-12 19:25:28,842][129210] Multi agent env, num agents: 8 -[2023-09-12 19:25:28,872][129210] RunningMeanStd input shape: (23,) -[2023-09-12 19:25:28,874][129210] RunningMeanStd input shape: (3, 72, 128) -[2023-09-12 19:25:28,875][129210] RunningMeanStd input shape: (1,) -[2023-09-12 19:25:28,886][129210] ConvEncoder: input_channels=3 -[2023-09-12 19:25:28,929][129210] Conv encoder output size: 512 -[2023-09-12 19:25:28,931][129210] Policy head output size: 640 -[2023-09-12 19:25:28,956][129210] No checkpoints found -[2023-09-12 19:25:29,809][09821] Port 40302 is available -[2023-09-12 19:25:29,809][09821] Using port 40302 -[2023-09-12 19:25:29,810][09821] Initializing env for player 0, init_info: {'port': 40302}... -[2023-09-12 19:25:29,810][09914] Port 41001 is available -[2023-09-12 19:25:29,811][09914] Using port 41001 -[2023-09-12 19:25:29,812][09914] Initializing env for player 0, init_info: {'port': 41001}... -[2023-09-12 19:25:29,846][09821] Using port 40302 on host... -[2023-09-12 19:25:29,846][09914] Using port 41001 on host... -[2023-09-12 19:25:29,861][09821] Initializing env for player 1, init_info: {'port': 40302}... -[2023-09-12 19:25:29,863][09914] Initializing env for player 1, init_info: {'port': 41001}... -[2023-09-12 19:25:29,912][09821] Initializing env for player 2, init_info: {'port': 40302}... -[2023-09-12 19:25:29,913][09914] Initializing env for player 2, init_info: {'port': 41001}... -[2023-09-12 19:25:29,963][09821] Initializing env for player 3, init_info: {'port': 40302}... -[2023-09-12 19:25:29,963][09914] Initializing env for player 3, init_info: {'port': 41001}... -[2023-09-12 19:25:30,015][09914] Initializing env for player 4, init_info: {'port': 41001}... -[2023-09-12 19:25:30,019][09821] Initializing env for player 4, init_info: {'port': 40302}... -[2023-09-12 19:25:30,071][09914] Initializing env for player 5, init_info: {'port': 41001}... -[2023-09-12 19:25:30,070][09821] Initializing env for player 5, init_info: {'port': 40302}... -[2023-09-12 19:25:30,127][09914] Initializing env for player 6, init_info: {'port': 41001}... -[2023-09-12 19:25:30,127][09821] Initializing env for player 6, init_info: {'port': 40302}... -[2023-09-12 19:25:30,179][09914] Initializing env for player 7, init_info: {'port': 41001}... -[2023-09-12 19:25:30,179][09821] Initializing env for player 7, init_info: {'port': 40302}... -[2023-09-12 19:25:31,286][09821] Initialized w:0 v:2 player:4 -[2023-09-12 19:25:31,286][09821] Initialized w:0 v:2 player:3 -[2023-09-12 19:25:31,286][09821] Initialized w:0 v:2 player:7 -[2023-09-12 19:25:31,286][09821] Initialized w:0 v:2 player:1 -[2023-09-12 19:25:31,286][09821] Initialized w:0 v:2 player:2 -[2023-09-12 19:25:31,286][09821] Initialized w:0 v:2 player:0 -[2023-09-12 19:25:31,287][09821] Initialized w:0 v:2 player:6 -[2023-09-12 19:25:31,287][09821] Initialized w:0 v:2 player:5 -[2023-09-12 19:25:31,290][09821] 8 agent workers initialized for env 0! -[2023-09-12 19:25:31,336][09821] Decorrelating experience for 64 frames... -[2023-09-12 19:25:31,357][09914] Initialized w:7 v:1 player:3 -[2023-09-12 19:25:31,359][09914] Initialized w:7 v:1 player:2 -[2023-09-12 19:25:31,359][09914] Initialized w:7 v:1 player:1 -[2023-09-12 19:25:31,360][09914] Initialized w:7 v:1 player:5 -[2023-09-12 19:25:31,360][09914] Initialized w:7 v:1 player:4 -[2023-09-12 19:25:31,360][09914] Initialized w:7 v:1 player:6 -[2023-09-12 19:25:31,361][09914] Initialized w:7 v:1 player:0 -[2023-09-12 19:25:31,791][09821] Port 40303 is available -[2023-09-12 19:25:31,791][09821] Using port 40303 -[2023-09-12 19:25:31,792][09821] Initializing env for player 0, init_info: {'port': 40303}... -[2023-09-12 19:25:31,821][09821] Using port 40303 on host... -[2023-09-12 19:25:31,842][09821] Initializing env for player 1, init_info: {'port': 40303}... -[2023-09-12 19:25:31,893][09821] Initializing env for player 2, init_info: {'port': 40303}... -[2023-09-12 19:25:31,943][09821] Initializing env for player 3, init_info: {'port': 40303}... -[2023-09-12 19:25:32,003][09821] Initializing env for player 4, init_info: {'port': 40303}... -[2023-09-12 19:25:32,055][09821] Initializing env for player 5, init_info: {'port': 40303}... -[2023-09-12 19:25:32,115][09821] Initializing env for player 6, init_info: {'port': 40303}... -[2023-09-12 19:25:32,167][09821] Initializing env for player 7, init_info: {'port': 40303}... -[2023-09-12 19:25:32,357][09914] Initialized w:7 v:1 player:7 -[2023-09-12 19:25:32,358][09914] 8 agent workers initialized for env 7! -[2023-09-12 19:25:32,411][09914] Decorrelating experience for 32 frames... -[2023-09-12 19:25:32,710][09914] Multi agent env, num agents: 8 -[2023-09-12 19:25:32,739][09914] Multi agent env, num agents: 8 -[2023-09-12 19:25:32,768][09914] Port 41002 is available -[2023-09-12 19:25:32,768][09914] Using port 41002 -[2023-09-12 19:25:32,769][09914] Initializing env for player 0, init_info: {'port': 41002}... -[2023-09-12 19:25:32,803][09914] Using port 41002 on host... -[2023-09-12 19:25:32,819][09914] Initializing env for player 1, init_info: {'port': 41002}... -[2023-09-12 19:25:32,870][09914] Initializing env for player 2, init_info: {'port': 41002}... -[2023-09-12 19:25:32,930][09914] Initializing env for player 3, init_info: {'port': 41002}... -[2023-09-12 19:25:32,977][09914] Initializing env for player 4, init_info: {'port': 41002}... -[2023-09-12 19:25:33,039][09914] Initializing env for player 5, init_info: {'port': 41002}... -[2023-09-12 19:25:33,090][09914] Initializing env for player 6, init_info: {'port': 41002}... -[2023-09-12 19:25:33,143][09914] Initializing env for player 7, init_info: {'port': 41002}... -[2023-09-12 19:25:33,553][09821] Initialized w:0 v:3 player:3 -[2023-09-12 19:25:33,554][09821] Initialized w:0 v:3 player:6 -[2023-09-12 19:25:33,554][09821] Initialized w:0 v:3 player:7 -[2023-09-12 19:25:33,554][09821] Initialized w:0 v:3 player:2 -[2023-09-12 19:25:33,554][09821] Initialized w:0 v:3 player:5 -[2023-09-12 19:25:33,554][09821] Initialized w:0 v:3 player:0 -[2023-09-12 19:25:33,554][09821] Initialized w:0 v:3 player:1 -[2023-09-12 19:25:33,554][09821] Initialized w:0 v:3 player:4 -[2023-09-12 19:25:33,557][09821] 8 agent workers initialized for env 0! -[2023-09-12 19:25:33,607][09821] Decorrelating experience for 96 frames... -[2023-09-12 19:25:34,389][09914] Initialized w:7 v:2 player:2 -[2023-09-12 19:25:34,391][09914] Initialized w:7 v:2 player:3 -[2023-09-12 19:25:34,391][09914] Initialized w:7 v:2 player:7 -[2023-09-12 19:25:34,392][09914] Initialized w:7 v:2 player:1 -[2023-09-12 19:25:34,392][09914] Initialized w:7 v:2 player:6 -[2023-09-12 19:25:34,392][09914] Initialized w:7 v:2 player:4 -[2023-09-12 19:25:34,392][09914] Initialized w:7 v:2 player:5 -[2023-09-12 19:25:34,392][09914] Initialized w:7 v:2 player:0 -[2023-09-12 19:25:34,394][09914] 8 agent workers initialized for env 7! -[2023-09-12 19:25:34,445][09914] Decorrelating experience for 64 frames... -[2023-09-12 19:25:35,056][09914] Port 41003 is available -[2023-09-12 19:25:35,056][09914] Using port 41003 -[2023-09-12 19:25:35,056][09914] Initializing env for player 0, init_info: {'port': 41003}... -[2023-09-12 19:25:35,085][09914] Using port 41003 on host... -[2023-09-12 19:25:35,107][09914] Initializing env for player 1, init_info: {'port': 41003}... -[2023-09-12 19:25:35,158][09914] Initializing env for player 2, init_info: {'port': 41003}... -[2023-09-12 19:25:35,209][09914] Initializing env for player 3, init_info: {'port': 41003}... -[2023-09-12 19:25:35,259][09914] Initializing env for player 4, init_info: {'port': 41003}... -[2023-09-12 19:25:35,319][09914] Initializing env for player 5, init_info: {'port': 41003}... -[2023-09-12 19:25:35,375][09914] Initializing env for player 6, init_info: {'port': 41003}... -[2023-09-12 19:25:35,451][09914] Initializing env for player 7, init_info: {'port': 41003}... -[2023-09-12 19:25:36,598][09914] Initialized w:7 v:3 player:2 -[2023-09-12 19:25:36,599][09914] Initialized w:7 v:3 player:3 -[2023-09-12 19:25:36,600][09914] Initialized w:7 v:3 player:7 -[2023-09-12 19:25:36,600][09914] Initialized w:7 v:3 player:1 -[2023-09-12 19:25:36,600][09914] Initialized w:7 v:3 player:6 -[2023-09-12 19:25:36,600][09914] Initialized w:7 v:3 player:4 -[2023-09-12 19:25:36,600][09914] Initialized w:7 v:3 player:5 -[2023-09-12 19:25:36,601][09914] Initialized w:7 v:3 player:0 -[2023-09-12 19:25:36,602][09914] 8 agent workers initialized for env 7! -[2023-09-12 19:25:36,645][09914] Decorrelating experience for 96 frames... -[2023-09-12 19:25:37,751][09821] Stopping RolloutWorker_w0... -[2023-09-12 19:25:37,752][09821] Loop rollout_proc0_evt_loop terminating... -[2023-09-12 19:25:40,652][09914] Stopping RolloutWorker_w7... -[2023-09-12 19:25:40,654][09914] Loop rollout_proc7_evt_loop terminating... -[2023-09-12 19:27:27,076][45761] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json... -[2023-09-12 19:27:28,113][45761] Rollout worker 0 uses device cpu -[2023-09-12 19:27:28,114][45761] Rollout worker 1 uses device cpu -[2023-09-12 19:27:28,115][45761] Rollout worker 2 uses device cpu -[2023-09-12 19:27:28,116][45761] Rollout worker 3 uses device cpu -[2023-09-12 19:27:28,117][45761] Rollout worker 4 uses device cpu -[2023-09-12 19:27:28,118][45761] Rollout worker 5 uses device cpu -[2023-09-12 19:27:28,119][45761] Rollout worker 6 uses device cpu -[2023-09-12 19:27:28,121][45761] Rollout worker 7 uses device cpu -[2023-09-12 19:27:28,310][45761] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 19:27:28,311][45761] InferenceWorker_p0-w0: min num requests: 2 -[2023-09-12 19:27:28,352][45761] Starting all processes... -[2023-09-12 19:27:28,353][45761] Starting process learner_proc0 -[2023-09-12 19:27:29,971][45761] Starting all processes... -[2023-09-12 19:27:29,972][47474] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 19:27:29,972][47474] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 -[2023-09-12 19:27:29,980][45761] Starting process inference_proc0-0 -[2023-09-12 19:27:29,980][45761] Starting process rollout_proc0 -[2023-09-12 19:27:29,981][45761] Starting process rollout_proc1 -[2023-09-12 19:27:29,981][45761] Starting process rollout_proc2 -[2023-09-12 19:27:29,982][45761] Starting process rollout_proc3 -[2023-09-12 19:27:29,983][45761] Starting process rollout_proc4 -[2023-09-12 19:27:29,984][45761] Starting process rollout_proc5 -[2023-09-12 19:27:30,010][47474] Num visible devices: 1 -[2023-09-12 19:27:30,052][47474] Starting seed is not provided -[2023-09-12 19:27:30,052][47474] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 19:27:30,052][47474] Initializing actor-critic model on device cuda:0 -[2023-09-12 19:27:30,052][47474] RunningMeanStd input shape: (23,) -[2023-09-12 19:27:30,053][47474] RunningMeanStd input shape: (3, 72, 128) -[2023-09-12 19:27:30,053][47474] RunningMeanStd input shape: (1,) -[2023-09-12 19:27:29,984][45761] Starting process rollout_proc6 -[2023-09-12 19:27:29,985][45761] Starting process rollout_proc7 -[2023-09-12 19:27:30,067][47474] ConvEncoder: input_channels=3 -[2023-09-12 19:27:30,299][47474] Conv encoder output size: 512 -[2023-09-12 19:27:30,300][47474] Policy head output size: 640 -[2023-09-12 19:27:30,318][47474] Created Actor Critic model with architecture: -[2023-09-12 19:27:30,318][47474] ActorCriticSharedWeights( - (obs_normalizer): ObservationNormalizer( - (running_mean_std): RunningMeanStdDictInPlace( - (running_mean_std): ModuleDict( - (measurements): RunningMeanStdInPlace() - (obs): RunningMeanStdInPlace() - ) - ) - ) - (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) - (encoder): VizdoomEncoder( - (basic_encoder): ConvEncoder( - (enc): RecursiveScriptModule( - original_name=ConvEncoderImpl - (conv_head): RecursiveScriptModule( - original_name=Sequential - (0): RecursiveScriptModule(original_name=Conv2d) - (1): RecursiveScriptModule(original_name=ELU) - (2): RecursiveScriptModule(original_name=Conv2d) - (3): RecursiveScriptModule(original_name=ELU) - (4): RecursiveScriptModule(original_name=Conv2d) - (5): RecursiveScriptModule(original_name=ELU) - ) - (mlp_layers): RecursiveScriptModule( - original_name=Sequential - (0): RecursiveScriptModule(original_name=Linear) - (1): RecursiveScriptModule(original_name=ELU) - ) - ) - ) - (measurements_head): Sequential( - (0): Linear(in_features=23, out_features=128, bias=True) - (1): ELU(alpha=1.0) - (2): Linear(in_features=128, out_features=128, bias=True) - (3): ELU(alpha=1.0) - ) - ) - (core): ModelCoreRNN( - (core): GRU(640, 512) - ) - (decoder): MlpDecoder( - (mlp): Identity() - ) - (critic_linear): Linear(in_features=512, out_features=1, bias=True) - (action_parameterization): ActionParameterizationDefault( - (distribution_linear): Linear(in_features=512, out_features=15, bias=True) - ) -) -[2023-09-12 19:27:31,551][47474] Using optimizer -[2023-09-12 19:27:31,551][47474] No checkpoints found -[2023-09-12 19:27:31,551][47474] Did not load from checkpoint, starting from scratch! -[2023-09-12 19:27:31,551][47474] Initialized policy 0 weights for model version 0 -[2023-09-12 19:27:31,553][47474] LearnerWorker_p0 finished initialization! -[2023-09-12 19:27:31,554][47474] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 19:27:31,975][47629] Worker 2 uses CPU cores [8, 9, 10, 11] -[2023-09-12 19:27:32,042][47594] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 19:27:32,042][47594] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 -[2023-09-12 19:27:32,060][47594] Num visible devices: 1 -[2023-09-12 19:27:32,062][47593] Worker 0 uses CPU cores [0, 1, 2, 3] -[2023-09-12 19:27:32,071][47627] Worker 1 uses CPU cores [4, 5, 6, 7] -[2023-09-12 19:27:32,155][47662] Worker 4 uses CPU cores [16, 17, 18, 19] -[2023-09-12 19:27:32,240][47630] Worker 5 uses CPU cores [20, 21, 22, 23] -[2023-09-12 19:27:32,280][47664] Worker 7 uses CPU cores [28, 29, 30, 31] -[2023-09-12 19:27:32,463][47628] Worker 3 uses CPU cores [12, 13, 14, 15] -[2023-09-12 19:27:32,576][47663] Worker 6 uses CPU cores [24, 25, 26, 27] -[2023-09-12 19:27:32,841][47594] RunningMeanStd input shape: (23,) -[2023-09-12 19:27:32,841][47594] RunningMeanStd input shape: (3, 72, 128) -[2023-09-12 19:27:32,842][47594] RunningMeanStd input shape: (1,) -[2023-09-12 19:27:32,853][47594] ConvEncoder: input_channels=3 -[2023-09-12 19:27:32,953][47594] Conv encoder output size: 512 -[2023-09-12 19:27:32,954][47594] Policy head output size: 640 -[2023-09-12 19:27:33,049][45761] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 0. Throughput: 0: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:27:33,301][45761] Inference worker 0-0 is ready! -[2023-09-12 19:27:33,302][45761] All inference workers are ready! Signal rollout workers to start! -[2023-09-12 19:27:33,306][47628] Multi agent env, num agents: 8 -[2023-09-12 19:27:33,307][47664] Multi agent env, num agents: 8 -[2023-09-12 19:27:33,307][47630] Multi agent env, num agents: 8 -[2023-09-12 19:27:33,307][47629] Multi agent env, num agents: 8 -[2023-09-12 19:27:33,307][47662] Multi agent env, num agents: 8 -[2023-09-12 19:27:33,308][47593] Multi agent env, num agents: 8 -[2023-09-12 19:27:33,308][47627] Multi agent env, num agents: 8 -[2023-09-12 19:27:33,308][47663] Multi agent env, num agents: 8 -[2023-09-12 19:27:33,340][47662] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 19:27:33,340][47664] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 19:27:33,340][47630] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 19:27:33,340][47593] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 19:27:33,341][47629] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 19:27:33,341][47627] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 19:27:33,343][47662] Multi agent env, num agents: 8 -[2023-09-12 19:27:33,343][47630] Multi agent env, num agents: 8 -[2023-09-12 19:27:33,343][47664] Multi agent env, num agents: 8 -[2023-09-12 19:27:33,343][47593] Multi agent env, num agents: 8 -[2023-09-12 19:27:33,344][47629] Multi agent env, num agents: 8 -[2023-09-12 19:27:33,344][47627] Multi agent env, num agents: 8 -[2023-09-12 19:27:33,349][47628] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 19:27:33,354][47663] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 19:27:33,354][47628] Multi agent env, num agents: 8 -[2023-09-12 19:27:33,358][47663] Multi agent env, num agents: 8 -[2023-09-12 19:27:33,375][47664] Port 41000 is available -[2023-09-12 19:27:33,375][47664] Using port 41000 -[2023-09-12 19:27:33,375][47630] Port 40800 is available -[2023-09-12 19:27:33,375][47593] Port 40300 is available -[2023-09-12 19:27:33,375][47630] Using port 40800 -[2023-09-12 19:27:33,375][47593] Using port 40300 -[2023-09-12 19:27:33,375][47662] Port 40700 is available -[2023-09-12 19:27:33,375][47662] Using port 40700 -[2023-09-12 19:27:33,375][47627] Port 40400 is available -[2023-09-12 19:27:33,376][47627] Using port 40400 -[2023-09-12 19:27:33,376][47629] Port 40500 is available -[2023-09-12 19:27:33,376][47629] Using port 40500 -[2023-09-12 19:27:33,376][47664] Initializing env for player 0, init_info: {'port': 41000}... -[2023-09-12 19:27:33,376][47630] Initializing env for player 0, init_info: {'port': 40800}... -[2023-09-12 19:27:33,376][47662] Initializing env for player 0, init_info: {'port': 40700}... -[2023-09-12 19:27:33,376][47627] Initializing env for player 0, init_info: {'port': 40400}... -[2023-09-12 19:27:33,376][47593] Initializing env for player 0, init_info: {'port': 40300}... -[2023-09-12 19:27:33,389][47663] Port 40900 is available -[2023-09-12 19:27:33,389][47663] Using port 40900 -[2023-09-12 19:27:33,390][47663] Initializing env for player 0, init_info: {'port': 40900}... -[2023-09-12 19:27:33,399][47628] Port 40600 is available -[2023-09-12 19:27:33,399][47628] Using port 40600 -[2023-09-12 19:27:33,400][47628] Initializing env for player 0, init_info: {'port': 40600}... -[2023-09-12 19:27:33,405][47662] Using port 40700 on host... -[2023-09-12 19:27:33,405][47627] Using port 40400 on host... -[2023-09-12 19:27:33,405][47630] Using port 40800 on host... -[2023-09-12 19:27:33,410][47664] Using port 41000 on host... -[2023-09-12 19:27:33,410][47593] Using port 40300 on host... -[2023-09-12 19:27:33,419][47663] Using port 40900 on host... -[2023-09-12 19:27:33,426][47664] Initializing env for player 1, init_info: {'port': 41000}... -[2023-09-12 19:27:33,427][47630] Initializing env for player 1, init_info: {'port': 40800}... -[2023-09-12 19:27:33,427][47593] Initializing env for player 1, init_info: {'port': 40300}... -[2023-09-12 19:27:33,427][47662] Initializing env for player 1, init_info: {'port': 40700}... -[2023-09-12 19:27:33,427][47627] Initializing env for player 1, init_info: {'port': 40400}... -[2023-09-12 19:27:33,431][47628] Using port 40600 on host... -[2023-09-12 19:27:33,441][47663] Initializing env for player 1, init_info: {'port': 40900}... -[2023-09-12 19:27:33,451][47628] Initializing env for player 1, init_info: {'port': 40600}... -[2023-09-12 19:27:33,477][47664] Initializing env for player 2, init_info: {'port': 41000}... -[2023-09-12 19:27:33,477][47627] Initializing env for player 2, init_info: {'port': 40400}... -[2023-09-12 19:27:33,479][47593] Initializing env for player 2, init_info: {'port': 40300}... -[2023-09-12 19:27:33,479][47662] Initializing env for player 2, init_info: {'port': 40700}... -[2023-09-12 19:27:33,480][47630] Initializing env for player 2, init_info: {'port': 40800}... -[2023-09-12 19:27:33,491][47663] Initializing env for player 2, init_info: {'port': 40900}... -[2023-09-12 19:27:33,503][47628] Initializing env for player 2, init_info: {'port': 40600}... -[2023-09-12 19:27:33,529][47627] Initializing env for player 3, init_info: {'port': 40400}... -[2023-09-12 19:27:33,530][47630] Initializing env for player 3, init_info: {'port': 40800}... -[2023-09-12 19:27:33,532][47593] Initializing env for player 3, init_info: {'port': 40300}... -[2023-09-12 19:27:33,535][47664] Initializing env for player 3, init_info: {'port': 41000}... -[2023-09-12 19:27:33,535][47662] Initializing env for player 3, init_info: {'port': 40700}... -[2023-09-12 19:27:33,543][47663] Initializing env for player 3, init_info: {'port': 40900}... -[2023-09-12 19:27:33,560][47628] Initializing env for player 3, init_info: {'port': 40600}... -[2023-09-12 19:27:33,579][47664] Initializing env for player 4, init_info: {'port': 41000}... -[2023-09-12 19:27:33,582][47630] Initializing env for player 4, init_info: {'port': 40800}... -[2023-09-12 19:27:33,584][47627] Initializing env for player 4, init_info: {'port': 40400}... -[2023-09-12 19:27:33,591][47662] Initializing env for player 4, init_info: {'port': 40700}... -[2023-09-12 19:27:33,591][47593] Initializing env for player 4, init_info: {'port': 40300}... -[2023-09-12 19:27:33,607][47628] Initializing env for player 4, init_info: {'port': 40600}... -[2023-09-12 19:27:33,608][47663] Initializing env for player 4, init_info: {'port': 40900}... -[2023-09-12 19:27:33,638][47593] Initializing env for player 5, init_info: {'port': 40300}... -[2023-09-12 19:27:33,639][47664] Initializing env for player 5, init_info: {'port': 41000}... -[2023-09-12 19:27:33,640][47627] Initializing env for player 5, init_info: {'port': 40400}... -[2023-09-12 19:27:33,656][47628] Initializing env for player 5, init_info: {'port': 40600}... -[2023-09-12 19:27:33,663][47663] Initializing env for player 5, init_info: {'port': 40900}... -[2023-09-12 19:27:33,643][47662] Initializing env for player 5, init_info: {'port': 40700}... -[2023-09-12 19:27:33,667][47630] Initializing env for player 5, init_info: {'port': 40800}... -[2023-09-12 19:27:33,683][47664] Initializing env for player 6, init_info: {'port': 41000}... -[2023-09-12 19:27:33,687][47630] Initializing env for player 6, init_info: {'port': 40800}... -[2023-09-12 19:27:33,691][47627] Initializing env for player 6, init_info: {'port': 40400}... -[2023-09-12 19:27:33,694][47593] Initializing env for player 6, init_info: {'port': 40300}... -[2023-09-12 19:27:33,707][47662] Initializing env for player 6, init_info: {'port': 40700}... -[2023-09-12 19:27:33,715][47663] Initializing env for player 6, init_info: {'port': 40900}... -[2023-09-12 19:27:33,724][47628] Initializing env for player 6, init_info: {'port': 40600}... -[2023-09-12 19:27:33,731][47664] Initializing env for player 7, init_info: {'port': 41000}... -[2023-09-12 19:27:33,741][47593] Initializing env for player 7, init_info: {'port': 40300}... -[2023-09-12 19:27:33,743][47662] Initializing env for player 7, init_info: {'port': 40700}... -[2023-09-12 19:27:33,743][47627] Initializing env for player 7, init_info: {'port': 40400}... -[2023-09-12 19:27:33,756][47630] Initializing env for player 7, init_info: {'port': 40800}... -[2023-09-12 19:27:33,774][47628] Initializing env for player 7, init_info: {'port': 40600}... -[2023-09-12 19:27:33,775][47663] Initializing env for player 7, init_info: {'port': 40900}... -[2023-09-12 19:27:35,030][47663] Initialized w:6 v:0 player:2 -[2023-09-12 19:27:35,031][47663] Initialized w:6 v:0 player:5 -[2023-09-12 19:27:35,032][47663] Initialized w:6 v:0 player:1 -[2023-09-12 19:27:35,032][47663] Initialized w:6 v:0 player:0 -[2023-09-12 19:27:35,032][47663] Initialized w:6 v:0 player:4 -[2023-09-12 19:27:35,032][47663] Initialized w:6 v:0 player:6 -[2023-09-12 19:27:35,033][47663] Initialized w:6 v:0 player:7 -[2023-09-12 19:27:35,033][47663] Initialized w:6 v:0 player:3 -[2023-09-12 19:27:35,036][47663] 8 agent workers initialized for env 6! -[2023-09-12 19:27:35,083][47663] Decorrelating experience for 0 frames... -[2023-09-12 19:27:35,085][47663] Port 40901 is available -[2023-09-12 19:27:35,085][47663] Using port 40901 -[2023-09-12 19:27:35,151][47627] Initialized w:1 v:0 player:0 -[2023-09-12 19:27:35,152][47627] Initialized w:1 v:0 player:4 -[2023-09-12 19:27:35,152][47627] Initialized w:1 v:0 player:7 -[2023-09-12 19:27:35,152][47627] Initialized w:1 v:0 player:6 -[2023-09-12 19:27:35,152][47627] Initialized w:1 v:0 player:1 -[2023-09-12 19:27:35,152][47627] Initialized w:1 v:0 player:2 -[2023-09-12 19:27:35,153][47627] Initialized w:1 v:0 player:3 -[2023-09-12 19:27:35,153][47627] Initialized w:1 v:0 player:5 -[2023-09-12 19:27:35,155][47627] 8 agent workers initialized for env 1! -[2023-09-12 19:27:35,186][47663] Initializing env for player 0, init_info: {'port': 40901}... -[2023-09-12 19:27:35,199][47627] Decorrelating experience for 0 frames... -[2023-09-12 19:27:35,201][47627] Port 40401 is available -[2023-09-12 19:27:35,201][47627] Using port 40401 -[2023-09-12 19:27:35,201][47627] Initializing env for player 0, init_info: {'port': 40401}... -[2023-09-12 19:27:35,215][47664] Initialized w:7 v:0 player:6 -[2023-09-12 19:27:35,216][47664] Initialized w:7 v:0 player:5 -[2023-09-12 19:27:35,217][47664] Initialized w:7 v:0 player:4 -[2023-09-12 19:27:35,217][47664] Initialized w:7 v:0 player:1 -[2023-09-12 19:27:35,217][47664] Initialized w:7 v:0 player:0 -[2023-09-12 19:27:35,217][47664] Initialized w:7 v:0 player:2 -[2023-09-12 19:27:35,217][47664] Initialized w:7 v:0 player:7 -[2023-09-12 19:27:35,218][47664] Initialized w:7 v:0 player:3 -[2023-09-12 19:27:35,221][47664] 8 agent workers initialized for env 7! -[2023-09-12 19:27:35,222][47663] Using port 40901 on host... -[2023-09-12 19:27:35,237][47663] Initializing env for player 1, init_info: {'port': 40901}... -[2023-09-12 19:27:35,238][47627] Using port 40401 on host... -[2023-09-12 19:27:35,252][47627] Initializing env for player 1, init_info: {'port': 40401}... -[2023-09-12 19:27:35,268][47628] Initialized w:3 v:0 player:7 -[2023-09-12 19:27:35,270][47628] Initialized w:3 v:0 player:6 -[2023-09-12 19:27:35,270][47628] Initialized w:3 v:0 player:1 -[2023-09-12 19:27:35,270][47628] Initialized w:3 v:0 player:3 -[2023-09-12 19:27:35,270][47628] Initialized w:3 v:0 player:2 -[2023-09-12 19:27:35,270][47628] Initialized w:3 v:0 player:5 -[2023-09-12 19:27:35,270][47628] Initialized w:3 v:0 player:0 -[2023-09-12 19:27:35,270][47628] Initialized w:3 v:0 player:4 -[2023-09-12 19:27:35,274][47628] 8 agent workers initialized for env 3! -[2023-09-12 19:27:35,275][47664] Decorrelating experience for 0 frames... -[2023-09-12 19:27:35,277][47664] Port 41001 is available -[2023-09-12 19:27:35,277][47664] Using port 41001 -[2023-09-12 19:27:35,278][47664] Initializing env for player 0, init_info: {'port': 41001}... -[2023-09-12 19:27:35,282][47630] Initialized w:5 v:0 player:6 -[2023-09-12 19:27:35,283][47630] Initialized w:5 v:0 player:4 -[2023-09-12 19:27:35,285][47630] Initialized w:5 v:0 player:2 -[2023-09-12 19:27:35,285][47630] Initialized w:5 v:0 player:3 -[2023-09-12 19:27:35,285][47630] Initialized w:5 v:0 player:0 -[2023-09-12 19:27:35,285][47630] Initialized w:5 v:0 player:1 -[2023-09-12 19:27:35,285][47630] Initialized w:5 v:0 player:7 -[2023-09-12 19:27:35,286][47630] Initialized w:5 v:0 player:5 -[2023-09-12 19:27:35,288][47630] 8 agent workers initialized for env 5! -[2023-09-12 19:27:35,295][47663] Initializing env for player 2, init_info: {'port': 40901}... -[2023-09-12 19:27:35,305][47627] Initializing env for player 2, init_info: {'port': 40401}... -[2023-09-12 19:27:35,314][47593] Initialized w:0 v:0 player:3 -[2023-09-12 19:27:35,316][47593] Initialized w:0 v:0 player:2 -[2023-09-12 19:27:35,317][47593] Initialized w:0 v:0 player:6 -[2023-09-12 19:27:35,317][47593] Initialized w:0 v:0 player:7 -[2023-09-12 19:27:35,317][47593] Initialized w:0 v:0 player:0 -[2023-09-12 19:27:35,317][47593] Initialized w:0 v:0 player:1 -[2023-09-12 19:27:35,318][47593] Initialized w:0 v:0 player:5 -[2023-09-12 19:27:35,318][47593] Initialized w:0 v:0 player:4 -[2023-09-12 19:27:35,320][47593] 8 agent workers initialized for env 0! -[2023-09-12 19:27:35,321][47664] Using port 41001 on host... -[2023-09-12 19:27:35,325][47628] Decorrelating experience for 0 frames... -[2023-09-12 19:27:35,326][47628] Port 40601 is available -[2023-09-12 19:27:35,326][47628] Using port 40601 -[2023-09-12 19:27:35,327][47628] Initializing env for player 0, init_info: {'port': 40601}... -[2023-09-12 19:27:35,329][47664] Initializing env for player 1, init_info: {'port': 41001}... -[2023-09-12 19:27:35,333][47630] Decorrelating experience for 0 frames... -[2023-09-12 19:27:35,336][47630] Port 40801 is available -[2023-09-12 19:27:35,336][47630] Using port 40801 -[2023-09-12 19:27:35,337][47630] Initializing env for player 0, init_info: {'port': 40801}... -[2023-09-12 19:27:35,355][47663] Initializing env for player 3, init_info: {'port': 40901}... -[2023-09-12 19:27:35,356][47627] Initializing env for player 3, init_info: {'port': 40401}... -[2023-09-12 19:27:35,357][47628] Using port 40601 on host... -[2023-09-12 19:27:35,360][47593] Decorrelating experience for 0 frames... -[2023-09-12 19:27:35,362][47593] Port 40301 is available -[2023-09-12 19:27:35,362][47593] Using port 40301 -[2023-09-12 19:27:35,363][47593] Initializing env for player 0, init_info: {'port': 40301}... -[2023-09-12 19:27:35,372][47630] Using port 40801 on host... -[2023-09-12 19:27:35,377][47628] Initializing env for player 1, init_info: {'port': 40601}... -[2023-09-12 19:27:35,379][47664] Initializing env for player 2, init_info: {'port': 41001}... -[2023-09-12 19:27:35,391][47630] Initializing env for player 1, init_info: {'port': 40801}... -[2023-09-12 19:27:35,396][47662] Initialized w:4 v:0 player:5 -[2023-09-12 19:27:35,399][47663] Initializing env for player 4, init_info: {'port': 40901}... -[2023-09-12 19:27:35,399][47662] Initialized w:4 v:0 player:6 -[2023-09-12 19:27:35,399][47662] Initialized w:4 v:0 player:7 -[2023-09-12 19:27:35,399][47662] Initialized w:4 v:0 player:4 -[2023-09-12 19:27:35,399][47662] Initialized w:4 v:0 player:1 -[2023-09-12 19:27:35,399][47662] Initialized w:4 v:0 player:2 -[2023-09-12 19:27:35,400][47662] Initialized w:4 v:0 player:0 -[2023-09-12 19:27:35,400][47662] Initialized w:4 v:0 player:3 -[2023-09-12 19:27:35,403][47662] 8 agent workers initialized for env 4! -[2023-09-12 19:27:35,406][47627] Initializing env for player 4, init_info: {'port': 40401}... -[2023-09-12 19:27:35,414][47593] Initializing env for player 1, init_info: {'port': 40301}... -[2023-09-12 19:27:35,428][47628] Initializing env for player 2, init_info: {'port': 40601}... -[2023-09-12 19:27:35,429][47664] Initializing env for player 3, init_info: {'port': 41001}... -[2023-09-12 19:27:35,436][47593] Using port 40301 on host... -[2023-09-12 19:27:35,448][47630] Initializing env for player 2, init_info: {'port': 40801}... -[2023-09-12 19:27:35,457][47627] Initializing env for player 5, init_info: {'port': 40401}... -[2023-09-12 19:27:35,464][47593] Initializing env for player 2, init_info: {'port': 40301}... -[2023-09-12 19:27:35,467][47663] Initializing env for player 5, init_info: {'port': 40901}... -[2023-09-12 19:27:35,475][47662] Decorrelating experience for 0 frames... -[2023-09-12 19:27:35,477][47662] Port 40701 is available -[2023-09-12 19:27:35,477][47662] Using port 40701 -[2023-09-12 19:27:35,479][47628] Initializing env for player 3, init_info: {'port': 40601}... -[2023-09-12 19:27:35,487][47664] Initializing env for player 4, init_info: {'port': 41001}... -[2023-09-12 19:27:35,501][47630] Initializing env for player 3, init_info: {'port': 40801}... -[2023-09-12 19:27:35,511][47627] Initializing env for player 6, init_info: {'port': 40401}... -[2023-09-12 19:27:35,519][47663] Initializing env for player 6, init_info: {'port': 40901}... -[2023-09-12 19:27:35,519][47593] Initializing env for player 3, init_info: {'port': 40301}... -[2023-09-12 19:27:35,535][47664] Initializing env for player 5, init_info: {'port': 41001}... -[2023-09-12 19:27:35,539][47628] Initializing env for player 4, init_info: {'port': 40601}... -[2023-09-12 19:27:35,551][47630] Initializing env for player 4, init_info: {'port': 40801}... -[2023-09-12 19:27:35,566][47627] Initializing env for player 7, init_info: {'port': 40401}... -[2023-09-12 19:27:35,571][47593] Initializing env for player 4, init_info: {'port': 40301}... -[2023-09-12 19:27:35,571][47663] Initializing env for player 7, init_info: {'port': 40901}... -[2023-09-12 19:27:35,587][47664] Initializing env for player 6, init_info: {'port': 41001}... -[2023-09-12 19:27:35,597][47628] Initializing env for player 5, init_info: {'port': 40601}... -[2023-09-12 19:27:35,603][47630] Initializing env for player 5, init_info: {'port': 40801}... -[2023-09-12 19:27:35,623][47593] Initializing env for player 5, init_info: {'port': 40301}... -[2023-09-12 19:27:35,635][47664] Initializing env for player 7, init_info: {'port': 41001}... -[2023-09-12 19:27:35,635][47628] Initializing env for player 6, init_info: {'port': 40601}... -[2023-09-12 19:27:35,655][47630] Initializing env for player 6, init_info: {'port': 40801}... -[2023-09-12 19:27:35,679][47593] Initializing env for player 6, init_info: {'port': 40301}... -[2023-09-12 19:27:35,687][47628] Initializing env for player 7, init_info: {'port': 40601}... -[2023-09-12 19:27:35,735][47593] Initializing env for player 7, init_info: {'port': 40301}... -[2023-09-12 19:27:35,756][47630] Initializing env for player 7, init_info: {'port': 40801}... -[2023-09-12 19:27:37,019][47663] Initialized w:6 v:1 player:1 -[2023-09-12 19:27:37,020][47663] Initialized w:6 v:1 player:0 -[2023-09-12 19:27:37,020][47663] Initialized w:6 v:1 player:2 -[2023-09-12 19:27:37,020][47663] Initialized w:6 v:1 player:3 -[2023-09-12 19:27:37,023][47663] Initialized w:6 v:1 player:4 -[2023-09-12 19:27:37,024][47663] Initialized w:6 v:1 player:6 -[2023-09-12 19:27:37,027][47663] Initialized w:6 v:1 player:7 -[2023-09-12 19:27:37,139][47593] Initialized w:0 v:1 player:5 -[2023-09-12 19:27:37,142][47593] Initialized w:0 v:1 player:1 -[2023-09-12 19:27:37,142][47593] Initialized w:0 v:1 player:6 -[2023-09-12 19:27:37,142][47593] Initialized w:0 v:1 player:4 -[2023-09-12 19:27:37,142][47593] Initialized w:0 v:1 player:2 -[2023-09-12 19:27:37,143][47593] Initialized w:0 v:1 player:3 -[2023-09-12 19:27:37,143][47593] Initialized w:0 v:1 player:0 -[2023-09-12 19:27:37,143][47593] Initialized w:0 v:1 player:7 -[2023-09-12 19:27:37,146][47593] 8 agent workers initialized for env 0! -[2023-09-12 19:27:37,159][47627] Initialized w:1 v:1 player:7 -[2023-09-12 19:27:37,162][47627] Initialized w:1 v:1 player:5 -[2023-09-12 19:27:37,162][47627] Initialized w:1 v:1 player:3 -[2023-09-12 19:27:37,162][47627] Initialized w:1 v:1 player:6 -[2023-09-12 19:27:37,162][47627] Initialized w:1 v:1 player:1 -[2023-09-12 19:27:37,163][47627] Initialized w:1 v:1 player:4 -[2023-09-12 19:27:37,164][47627] Initialized w:1 v:1 player:2 -[2023-09-12 19:27:37,165][47627] Initialized w:1 v:1 player:0 -[2023-09-12 19:27:37,167][47627] 8 agent workers initialized for env 1! -[2023-09-12 19:27:37,199][47593] Decorrelating experience for 32 frames... -[2023-09-12 19:27:37,202][47664] Initialized w:7 v:1 player:0 -[2023-09-12 19:27:37,203][47664] Initialized w:7 v:1 player:6 -[2023-09-12 19:27:37,203][47664] Initialized w:7 v:1 player:1 -[2023-09-12 19:27:37,205][47664] Initialized w:7 v:1 player:5 -[2023-09-12 19:27:37,205][47664] Initialized w:7 v:1 player:7 -[2023-09-12 19:27:37,205][47664] Initialized w:7 v:1 player:3 -[2023-09-12 19:27:37,207][47664] Initialized w:7 v:1 player:2 -[2023-09-12 19:27:37,207][47664] Initialized w:7 v:1 player:4 -[2023-09-12 19:27:37,208][47664] 8 agent workers initialized for env 7! -[2023-09-12 19:27:37,226][47630] Initialized w:5 v:1 player:7 -[2023-09-12 19:27:37,228][47630] Initialized w:5 v:1 player:1 -[2023-09-12 19:27:37,229][47630] Initialized w:5 v:1 player:0 -[2023-09-12 19:27:37,230][47630] Initialized w:5 v:1 player:5 -[2023-09-12 19:27:37,231][47630] Initialized w:5 v:1 player:4 -[2023-09-12 19:27:37,231][47630] Initialized w:5 v:1 player:2 -[2023-09-12 19:27:37,231][47630] Initialized w:5 v:1 player:3 -[2023-09-12 19:27:37,232][47627] Decorrelating experience for 32 frames... -[2023-09-12 19:27:37,232][47630] Initialized w:5 v:1 player:6 -[2023-09-12 19:27:37,233][47630] 8 agent workers initialized for env 5! -[2023-09-12 19:27:37,252][47628] Initialized w:3 v:1 player:3 -[2023-09-12 19:27:37,254][47628] Initialized w:3 v:1 player:7 -[2023-09-12 19:27:37,254][47628] Initialized w:3 v:1 player:2 -[2023-09-12 19:27:37,254][47628] Initialized w:3 v:1 player:1 -[2023-09-12 19:27:37,254][47628] Initialized w:3 v:1 player:0 -[2023-09-12 19:27:37,254][47628] Initialized w:3 v:1 player:6 -[2023-09-12 19:27:37,254][47628] Initialized w:3 v:1 player:4 -[2023-09-12 19:27:37,254][47628] Initialized w:3 v:1 player:5 -[2023-09-12 19:27:37,258][47628] 8 agent workers initialized for env 3! -[2023-09-12 19:27:37,260][47664] Decorrelating experience for 32 frames... -[2023-09-12 19:27:37,288][47630] Decorrelating experience for 32 frames... -[2023-09-12 19:27:37,311][47628] Decorrelating experience for 32 frames... -[2023-09-12 19:27:37,577][47593] Multi agent env, num agents: 8 -[2023-09-12 19:27:37,607][47593] Multi agent env, num agents: 8 -[2023-09-12 19:27:37,611][47664] Multi agent env, num agents: 8 -[2023-09-12 19:27:37,638][47593] Port 40302 is available -[2023-09-12 19:27:37,639][47593] Using port 40302 -[2023-09-12 19:27:37,640][47593] Initializing env for player 0, init_info: {'port': 40302}... -[2023-09-12 19:27:37,651][47664] Multi agent env, num agents: 8 -[2023-09-12 19:27:37,660][47628] Multi agent env, num agents: 8 -[2023-09-12 19:27:37,669][47593] Using port 40302 on host... -[2023-09-12 19:27:37,682][47664] Port 41002 is available -[2023-09-12 19:27:37,682][47664] Using port 41002 -[2023-09-12 19:27:37,683][47664] Initializing env for player 0, init_info: {'port': 41002}... -[2023-09-12 19:27:37,691][47628] Multi agent env, num agents: 8 -[2023-09-12 19:27:37,690][47593] Initializing env for player 1, init_info: {'port': 40302}... -[2023-09-12 19:27:37,698][47630] Multi agent env, num agents: 8 -[2023-09-12 19:27:37,714][47664] Using port 41002 on host... -[2023-09-12 19:27:37,722][47628] Port 40602 is available -[2023-09-12 19:27:37,722][47628] Using port 40602 -[2023-09-12 19:27:37,723][47628] Initializing env for player 0, init_info: {'port': 40602}... -[2023-09-12 19:27:37,733][47664] Initializing env for player 1, init_info: {'port': 41002}... -[2023-09-12 19:27:37,735][47627] Multi agent env, num agents: 8 -[2023-09-12 19:27:37,739][47630] Multi agent env, num agents: 8 -[2023-09-12 19:27:37,747][47593] Initializing env for player 2, init_info: {'port': 40302}... -[2023-09-12 19:27:37,755][47628] Using port 40602 on host... -[2023-09-12 19:27:37,767][47627] Multi agent env, num agents: 8 -[2023-09-12 19:27:37,769][47630] Port 40802 is available -[2023-09-12 19:27:37,769][47630] Using port 40802 -[2023-09-12 19:27:37,769][47630] Initializing env for player 0, init_info: {'port': 40802}... -[2023-09-12 19:27:37,774][47628] Initializing env for player 1, init_info: {'port': 40602}... -[2023-09-12 19:27:37,784][47664] Initializing env for player 2, init_info: {'port': 41002}... -[2023-09-12 19:27:37,797][47630] Using port 40802 on host... -[2023-09-12 19:27:37,798][47627] Port 40402 is available -[2023-09-12 19:27:37,798][47627] Using port 40402 -[2023-09-12 19:27:37,797][47593] Initializing env for player 3, init_info: {'port': 40302}... -[2023-09-12 19:27:37,798][47627] Initializing env for player 0, init_info: {'port': 40402}... -[2023-09-12 19:27:37,820][47630] Initializing env for player 1, init_info: {'port': 40802}... -[2023-09-12 19:27:37,829][47627] Using port 40402 on host... -[2023-09-12 19:27:37,831][47628] Initializing env for player 2, init_info: {'port': 40602}... -[2023-09-12 19:27:37,834][47664] Initializing env for player 3, init_info: {'port': 41002}... -[2023-09-12 19:27:37,849][47627] Initializing env for player 1, init_info: {'port': 40402}... -[2023-09-12 19:27:37,856][47593] Initializing env for player 4, init_info: {'port': 40302}... -[2023-09-12 19:27:37,870][47630] Initializing env for player 2, init_info: {'port': 40802}... -[2023-09-12 19:27:37,888][47628] Initializing env for player 3, init_info: {'port': 40602}... -[2023-09-12 19:27:37,891][47664] Initializing env for player 4, init_info: {'port': 41002}... -[2023-09-12 19:27:37,900][47627] Initializing env for player 2, init_info: {'port': 40402}... -[2023-09-12 19:27:37,911][47593] Initializing env for player 5, init_info: {'port': 40302}... -[2023-09-12 19:27:37,921][47630] Initializing env for player 3, init_info: {'port': 40802}... -[2023-09-12 19:27:37,939][47628] Initializing env for player 4, init_info: {'port': 40602}... -[2023-09-12 19:27:37,939][47664] Initializing env for player 5, init_info: {'port': 41002}... -[2023-09-12 19:27:37,953][47627] Initializing env for player 3, init_info: {'port': 40402}... -[2023-09-12 19:27:37,959][47593] Initializing env for player 6, init_info: {'port': 40302}... -[2023-09-12 19:27:37,979][47630] Initializing env for player 4, init_info: {'port': 40802}... -[2023-09-12 19:27:37,995][47628] Initializing env for player 5, init_info: {'port': 40602}... -[2023-09-12 19:27:38,011][47627] Initializing env for player 4, init_info: {'port': 40402}... -[2023-09-12 19:27:38,011][47664] Initializing env for player 6, init_info: {'port': 41002}... -[2023-09-12 19:27:38,018][47663] Initialized w:6 v:1 player:5 -[2023-09-12 19:27:38,021][47663] 8 agent workers initialized for env 6! -[2023-09-12 19:27:38,031][47630] Initializing env for player 5, init_info: {'port': 40802}... -[2023-09-12 19:27:38,038][47629] Initializing env for player 0, init_info: {'port': 40500}... -[2023-09-12 19:27:38,047][47628] Initializing env for player 6, init_info: {'port': 40602}... -[2023-09-12 19:27:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:27:38,071][47627] Initializing env for player 5, init_info: {'port': 40402}... -[2023-09-12 19:27:38,071][47664] Initializing env for player 7, init_info: {'port': 41002}... -[2023-09-12 19:27:38,084][47629] Using port 40500 on host... -[2023-09-12 19:27:38,091][47629] Initializing env for player 1, init_info: {'port': 40500}... -[2023-09-12 19:27:38,091][47630] Initializing env for player 6, init_info: {'port': 40802}... -[2023-09-12 19:27:38,043][47593] Initializing env for player 7, init_info: {'port': 40302}... -[2023-09-12 19:27:38,119][47627] Initializing env for player 6, init_info: {'port': 40402}... -[2023-09-12 19:27:38,122][47628] Initializing env for player 7, init_info: {'port': 40602}... -[2023-09-12 19:27:38,142][47629] Initializing env for player 2, init_info: {'port': 40500}... -[2023-09-12 19:27:38,155][47630] Initializing env for player 7, init_info: {'port': 40802}... -[2023-09-12 19:27:38,182][47663] Decorrelating experience for 32 frames... -[2023-09-12 19:27:38,179][47627] Initializing env for player 7, init_info: {'port': 40402}... -[2023-09-12 19:27:38,195][47629] Initializing env for player 3, init_info: {'port': 40500}... -[2023-09-12 19:27:38,258][47629] Initializing env for player 4, init_info: {'port': 40500}... -[2023-09-12 19:27:38,305][47629] Initializing env for player 5, init_info: {'port': 40500}... -[2023-09-12 19:27:38,359][47629] Initializing env for player 6, init_info: {'port': 40500}... -[2023-09-12 19:27:38,415][47629] Initializing env for player 7, init_info: {'port': 40500}... -[2023-09-12 19:27:38,800][47663] Multi agent env, num agents: 8 -[2023-09-12 19:27:38,846][47663] Multi agent env, num agents: 8 -[2023-09-12 19:27:38,893][47663] Port 40902 is available -[2023-09-12 19:27:38,893][47663] Using port 40902 -[2023-09-12 19:27:38,894][47663] Initializing env for player 0, init_info: {'port': 40902}... -[2023-09-12 19:27:38,938][47663] Using port 40902 on host... -[2023-09-12 19:27:38,944][47663] Initializing env for player 1, init_info: {'port': 40902}... -[2023-09-12 19:27:38,995][47663] Initializing env for player 2, init_info: {'port': 40902}... -[2023-09-12 19:27:39,045][47663] Initializing env for player 3, init_info: {'port': 40902}... -[2023-09-12 19:27:39,096][47663] Initializing env for player 4, init_info: {'port': 40902}... -[2023-09-12 19:27:39,149][47663] Initializing env for player 5, init_info: {'port': 40902}... -[2023-09-12 19:27:39,203][47663] Initializing env for player 6, init_info: {'port': 40902}... -[2023-09-12 19:27:39,255][47663] Initializing env for player 7, init_info: {'port': 40902}... -[2023-09-12 19:27:39,429][47593] Initialized w:0 v:2 player:1 -[2023-09-12 19:27:39,429][47593] Initialized w:0 v:2 player:6 -[2023-09-12 19:27:39,431][47593] Initialized w:0 v:2 player:2 -[2023-09-12 19:27:39,430][47593] Initialized w:0 v:2 player:0 -[2023-09-12 19:27:39,430][47593] Initialized w:0 v:2 player:3 -[2023-09-12 19:27:39,430][47593] Initialized w:0 v:2 player:5 -[2023-09-12 19:27:39,430][47593] Initialized w:0 v:2 player:7 -[2023-09-12 19:27:39,430][47593] Initialized w:0 v:2 player:4 -[2023-09-12 19:27:39,436][47593] 8 agent workers initialized for env 0! -[2023-09-12 19:27:39,490][47593] Decorrelating experience for 64 frames... -[2023-09-12 19:27:39,675][47664] Initialized w:7 v:2 player:1 -[2023-09-12 19:27:39,676][47664] Initialized w:7 v:2 player:7 -[2023-09-12 19:27:39,677][47664] Initialized w:7 v:2 player:3 -[2023-09-12 19:27:39,677][47664] Initialized w:7 v:2 player:2 -[2023-09-12 19:27:39,678][47664] Initialized w:7 v:2 player:6 -[2023-09-12 19:27:39,678][47664] Initialized w:7 v:2 player:0 -[2023-09-12 19:27:39,678][47664] Initialized w:7 v:2 player:4 -[2023-09-12 19:27:39,679][47664] Initialized w:7 v:2 player:5 -[2023-09-12 19:27:39,681][47664] 8 agent workers initialized for env 7! -[2023-09-12 19:27:39,683][47628] Initialized w:3 v:2 player:5 -[2023-09-12 19:27:39,684][47628] Initialized w:3 v:2 player:0 -[2023-09-12 19:27:39,684][47628] Initialized w:3 v:2 player:2 -[2023-09-12 19:27:39,686][47628] Initialized w:3 v:2 player:6 -[2023-09-12 19:27:39,685][47628] Initialized w:3 v:2 player:1 -[2023-09-12 19:27:39,685][47628] Initialized w:3 v:2 player:7 -[2023-09-12 19:27:39,685][47628] Initialized w:3 v:2 player:3 -[2023-09-12 19:27:39,684][47628] Initialized w:3 v:2 player:4 -[2023-09-12 19:27:39,688][47628] 8 agent workers initialized for env 3! -[2023-09-12 19:27:39,699][47630] Initialized w:5 v:2 player:0 -[2023-09-12 19:27:39,700][47630] Initialized w:5 v:2 player:2 -[2023-09-12 19:27:39,701][47630] Initialized w:5 v:2 player:6 -[2023-09-12 19:27:39,703][47630] Initialized w:5 v:2 player:3 -[2023-09-12 19:27:39,703][47630] Initialized w:5 v:2 player:1 -[2023-09-12 19:27:39,703][47630] Initialized w:5 v:2 player:5 -[2023-09-12 19:27:39,703][47630] Initialized w:5 v:2 player:4 -[2023-09-12 19:27:39,704][47630] Initialized w:5 v:2 player:7 -[2023-09-12 19:27:39,706][47630] 8 agent workers initialized for env 5! -[2023-09-12 19:27:39,718][47664] Decorrelating experience for 64 frames... -[2023-09-12 19:27:39,737][47628] Decorrelating experience for 64 frames... -[2023-09-12 19:27:39,758][47630] Decorrelating experience for 64 frames... -[2023-09-12 19:27:39,756][47627] Initialized w:1 v:2 player:3 -[2023-09-12 19:27:39,759][47627] Initialized w:1 v:2 player:2 -[2023-09-12 19:27:39,759][47627] Initialized w:1 v:2 player:1 -[2023-09-12 19:27:39,759][47627] Initialized w:1 v:2 player:5 -[2023-09-12 19:27:39,759][47627] Initialized w:1 v:2 player:4 -[2023-09-12 19:27:39,760][47627] Initialized w:1 v:2 player:0 -[2023-09-12 19:27:39,760][47627] Initialized w:1 v:2 player:7 -[2023-09-12 19:27:39,760][47627] Initialized w:1 v:2 player:6 -[2023-09-12 19:27:39,763][47627] 8 agent workers initialized for env 1! -[2023-09-12 19:27:39,811][47627] Decorrelating experience for 64 frames... -[2023-09-12 19:27:39,874][47629] Initialized w:2 v:0 player:4 -[2023-09-12 19:27:39,875][47629] Initialized w:2 v:0 player:7 -[2023-09-12 19:27:39,876][47629] Initialized w:2 v:0 player:1 -[2023-09-12 19:27:39,876][47629] Initialized w:2 v:0 player:0 -[2023-09-12 19:27:39,876][47629] Initialized w:2 v:0 player:3 -[2023-09-12 19:27:39,876][47629] Initialized w:2 v:0 player:6 -[2023-09-12 19:27:39,878][47629] Initialized w:2 v:0 player:5 -[2023-09-12 19:27:39,878][47629] Initialized w:2 v:0 player:2 -[2023-09-12 19:27:39,879][47629] 8 agent workers initialized for env 2! -[2023-09-12 19:27:39,889][47662] Initializing env for player 0, init_info: {'port': 40701}... -[2023-09-12 19:27:39,919][47629] Decorrelating experience for 0 frames... -[2023-09-12 19:27:39,922][47629] Port 40501 is available -[2023-09-12 19:27:39,922][47629] Using port 40501 -[2023-09-12 19:27:39,922][47629] Initializing env for player 0, init_info: {'port': 40501}... -[2023-09-12 19:27:39,933][47662] Using port 40701 on host... -[2023-09-12 19:27:39,942][47662] Initializing env for player 1, init_info: {'port': 40701}... -[2023-09-12 19:27:39,953][47629] Using port 40501 on host... -[2023-09-12 19:27:39,973][47629] Initializing env for player 1, init_info: {'port': 40501}... -[2023-09-12 19:27:39,995][47662] Initializing env for player 2, init_info: {'port': 40701}... -[2023-09-12 19:27:40,023][47629] Initializing env for player 2, init_info: {'port': 40501}... -[2023-09-12 19:27:40,046][47662] Initializing env for player 3, init_info: {'port': 40701}... -[2023-09-12 19:27:40,082][47629] Initializing env for player 3, init_info: {'port': 40501}... -[2023-09-12 19:27:40,107][47662] Initializing env for player 4, init_info: {'port': 40701}... -[2023-09-12 19:27:40,139][47629] Initializing env for player 4, init_info: {'port': 40501}... -[2023-09-12 19:27:40,167][47662] Initializing env for player 5, init_info: {'port': 40701}... -[2023-09-12 19:27:40,195][47629] Initializing env for player 5, init_info: {'port': 40501}... -[2023-09-12 19:27:40,223][47662] Initializing env for player 6, init_info: {'port': 40701}... -[2023-09-12 19:27:40,251][47629] Initializing env for player 6, init_info: {'port': 40501}... -[2023-09-12 19:27:40,266][47593] Port 40303 is available -[2023-09-12 19:27:40,266][47593] Using port 40303 -[2023-09-12 19:27:40,267][47593] Initializing env for player 0, init_info: {'port': 40303}... -[2023-09-12 19:27:40,283][47662] Initializing env for player 7, init_info: {'port': 40701}... -[2023-09-12 19:27:40,312][47593] Using port 40303 on host... -[2023-09-12 19:27:40,314][47629] Initializing env for player 7, init_info: {'port': 40501}... -[2023-09-12 19:27:40,326][47593] Initializing env for player 1, init_info: {'port': 40303}... -[2023-09-12 19:27:40,376][47593] Initializing env for player 2, init_info: {'port': 40303}... -[2023-09-12 19:27:40,408][47628] Port 40603 is available -[2023-09-12 19:27:40,408][47628] Using port 40603 -[2023-09-12 19:27:40,409][47628] Initializing env for player 0, init_info: {'port': 40603}... -[2023-09-12 19:27:40,421][47664] Port 41003 is available -[2023-09-12 19:27:40,421][47664] Using port 41003 -[2023-09-12 19:27:40,421][47664] Initializing env for player 0, init_info: {'port': 41003}... -[2023-09-12 19:27:40,435][47593] Initializing env for player 3, init_info: {'port': 40303}... -[2023-09-12 19:27:40,441][47628] Using port 40603 on host... -[2023-09-12 19:27:40,452][47664] Using port 41003 on host... -[2023-09-12 19:27:40,460][47628] Initializing env for player 1, init_info: {'port': 40603}... -[2023-09-12 19:27:40,472][47664] Initializing env for player 1, init_info: {'port': 41003}... -[2023-09-12 19:27:40,487][47593] Initializing env for player 4, init_info: {'port': 40303}... -[2023-09-12 19:27:40,505][47663] Initialized w:6 v:2 player:0 -[2023-09-12 19:27:40,506][47663] Initialized w:6 v:2 player:6 -[2023-09-12 19:27:40,507][47663] Initialized w:6 v:2 player:4 -[2023-09-12 19:27:40,508][47663] Initialized w:6 v:2 player:3 -[2023-09-12 19:27:40,508][47663] Initialized w:6 v:2 player:1 -[2023-09-12 19:27:40,509][47663] Initialized w:6 v:2 player:5 -[2023-09-12 19:27:40,510][47663] Initialized w:6 v:2 player:2 -[2023-09-12 19:27:40,510][47628] Initializing env for player 2, init_info: {'port': 40603}... -[2023-09-12 19:27:40,510][47663] Initialized w:6 v:2 player:7 -[2023-09-12 19:27:40,512][47663] 8 agent workers initialized for env 6! -[2023-09-12 19:27:40,522][47630] Port 40803 is available -[2023-09-12 19:27:40,522][47630] Using port 40803 -[2023-09-12 19:27:40,526][47664] Initializing env for player 2, init_info: {'port': 41003}... -[2023-09-12 19:27:40,533][47627] Port 40403 is available -[2023-09-12 19:27:40,533][47627] Using port 40403 -[2023-09-12 19:27:40,534][47627] Initializing env for player 0, init_info: {'port': 40403}... -[2023-09-12 19:27:40,539][47593] Initializing env for player 5, init_info: {'port': 40303}... -[2023-09-12 19:27:40,563][47628] Initializing env for player 3, init_info: {'port': 40603}... -[2023-09-12 19:27:40,564][47627] Using port 40403 on host... -[2023-09-12 19:27:40,584][47627] Initializing env for player 1, init_info: {'port': 40403}... -[2023-09-12 19:27:40,586][47663] Decorrelating experience for 64 frames... -[2023-09-12 19:27:40,587][47664] Initializing env for player 3, init_info: {'port': 41003}... -[2023-09-12 19:27:40,591][47593] Initializing env for player 6, init_info: {'port': 40303}... -[2023-09-12 19:27:40,619][47628] Initializing env for player 4, init_info: {'port': 40603}... -[2023-09-12 19:27:40,635][47664] Initializing env for player 4, init_info: {'port': 41003}... -[2023-09-12 19:27:40,635][47627] Initializing env for player 2, init_info: {'port': 40403}... -[2023-09-12 19:27:40,683][47593] Initializing env for player 7, init_info: {'port': 40303}... -[2023-09-12 19:27:40,685][47627] Initializing env for player 3, init_info: {'port': 40403}... -[2023-09-12 19:27:40,687][47628] Initializing env for player 5, init_info: {'port': 40603}... -[2023-09-12 19:27:40,699][47664] Initializing env for player 5, init_info: {'port': 41003}... -[2023-09-12 19:27:40,733][47628] Initializing env for player 6, init_info: {'port': 40603}... -[2023-09-12 19:27:40,739][47627] Initializing env for player 4, init_info: {'port': 40403}... -[2023-09-12 19:27:40,763][47664] Initializing env for player 6, init_info: {'port': 41003}... -[2023-09-12 19:27:40,815][47664] Initializing env for player 7, init_info: {'port': 41003}... -[2023-09-12 19:27:40,816][47627] Initializing env for player 5, init_info: {'port': 40403}... -[2023-09-12 19:27:40,827][47628] Initializing env for player 7, init_info: {'port': 40603}... -[2023-09-12 19:27:40,883][47627] Initializing env for player 6, init_info: {'port': 40403}... -[2023-09-12 19:27:40,935][47627] Initializing env for player 7, init_info: {'port': 40403}... -[2023-09-12 19:27:41,496][47663] Port 40903 is available -[2023-09-12 19:27:41,496][47663] Using port 40903 -[2023-09-12 19:27:41,496][47663] Initializing env for player 0, init_info: {'port': 40903}... -[2023-09-12 19:27:41,524][47663] Using port 40903 on host... -[2023-09-12 19:27:41,547][47663] Initializing env for player 1, init_info: {'port': 40903}... -[2023-09-12 19:27:41,585][47662] Initialized w:4 v:1 player:4 -[2023-09-12 19:27:41,587][47662] Initialized w:4 v:1 player:6 -[2023-09-12 19:27:41,587][47662] Initialized w:4 v:1 player:2 -[2023-09-12 19:27:41,587][47662] Initialized w:4 v:1 player:7 -[2023-09-12 19:27:41,588][47662] Initialized w:4 v:1 player:5 -[2023-09-12 19:27:41,588][47662] Initialized w:4 v:1 player:3 -[2023-09-12 19:27:41,590][47662] Initialized w:4 v:1 player:0 -[2023-09-12 19:27:41,590][47662] Initialized w:4 v:1 player:1 -[2023-09-12 19:27:41,591][47662] 8 agent workers initialized for env 4! -[2023-09-12 19:27:41,611][47663] Initializing env for player 2, init_info: {'port': 40903}... -[2023-09-12 19:27:41,629][47629] Initialized w:2 v:1 player:2 -[2023-09-12 19:27:41,631][47629] Initialized w:2 v:1 player:0 -[2023-09-12 19:27:41,632][47629] Initialized w:2 v:1 player:7 -[2023-09-12 19:27:41,632][47629] Initialized w:2 v:1 player:5 -[2023-09-12 19:27:41,632][47629] Initialized w:2 v:1 player:1 -[2023-09-12 19:27:41,633][47629] Initialized w:2 v:1 player:3 -[2023-09-12 19:27:41,633][47629] Initialized w:2 v:1 player:6 -[2023-09-12 19:27:41,634][47629] Initialized w:2 v:1 player:4 -[2023-09-12 19:27:41,636][47629] 8 agent workers initialized for env 2! -[2023-09-12 19:27:41,645][47662] Decorrelating experience for 32 frames... -[2023-09-12 19:27:41,668][47663] Initializing env for player 3, init_info: {'port': 40903}... -[2023-09-12 19:27:41,683][47630] Initializing env for player 0, init_info: {'port': 40803}... -[2023-09-12 19:27:41,690][47629] Decorrelating experience for 32 frames... -[2023-09-12 19:27:41,718][47663] Initializing env for player 4, init_info: {'port': 40903}... -[2023-09-12 19:27:41,729][47630] Using port 40803 on host... -[2023-09-12 19:27:41,733][47630] Initializing env for player 1, init_info: {'port': 40803}... -[2023-09-12 19:27:41,775][47663] Initializing env for player 5, init_info: {'port': 40903}... -[2023-09-12 19:27:41,789][47630] Initializing env for player 2, init_info: {'port': 40803}... -[2023-09-12 19:27:41,835][47663] Initializing env for player 6, init_info: {'port': 40903}... -[2023-09-12 19:27:41,843][47630] Initializing env for player 3, init_info: {'port': 40803}... -[2023-09-12 19:27:41,895][47630] Initializing env for player 4, init_info: {'port': 40803}... -[2023-09-12 19:27:41,931][47663] Initializing env for player 7, init_info: {'port': 40903}... -[2023-09-12 19:27:41,946][47630] Initializing env for player 5, init_info: {'port': 40803}... -[2023-09-12 19:27:41,978][47662] Multi agent env, num agents: 8 -[2023-09-12 19:27:41,999][47630] Initializing env for player 6, init_info: {'port': 40803}... -[2023-09-12 19:27:42,009][47662] Multi agent env, num agents: 8 -[2023-09-12 19:27:42,039][47662] Port 40702 is available -[2023-09-12 19:27:42,040][47662] Using port 40702 -[2023-09-12 19:27:42,051][47629] Multi agent env, num agents: 8 -[2023-09-12 19:27:42,055][47630] Initializing env for player 7, init_info: {'port': 40803}... -[2023-09-12 19:27:42,092][47629] Multi agent env, num agents: 8 -[2023-09-12 19:27:42,139][47629] Port 40502 is available -[2023-09-12 19:27:42,139][47629] Using port 40502 -[2023-09-12 19:27:42,140][47629] Initializing env for player 0, init_info: {'port': 40502}... -[2023-09-12 19:27:42,174][47593] Initialized w:0 v:3 player:7 -[2023-09-12 19:27:42,176][47593] Initialized w:0 v:3 player:0 -[2023-09-12 19:27:42,176][47593] Initialized w:0 v:3 player:4 -[2023-09-12 19:27:42,177][47593] Initialized w:0 v:3 player:1 -[2023-09-12 19:27:42,177][47593] Initialized w:0 v:3 player:5 -[2023-09-12 19:27:42,177][47593] Initialized w:0 v:3 player:2 -[2023-09-12 19:27:42,177][47593] Initialized w:0 v:3 player:6 -[2023-09-12 19:27:42,178][47593] Initialized w:0 v:3 player:3 -[2023-09-12 19:27:42,180][47593] 8 agent workers initialized for env 0! -[2023-09-12 19:27:42,184][47629] Using port 40502 on host... -[2023-09-12 19:27:42,195][47629] Initializing env for player 1, init_info: {'port': 40502}... -[2023-09-12 19:27:42,219][47593] Decorrelating experience for 96 frames... -[2023-09-12 19:27:42,247][47627] Initialized w:1 v:3 player:1 -[2023-09-12 19:27:42,249][47627] Initialized w:1 v:3 player:4 -[2023-09-12 19:27:42,250][47627] Initialized w:1 v:3 player:2 -[2023-09-12 19:27:42,252][47627] Initialized w:1 v:3 player:0 -[2023-09-12 19:27:42,253][47627] Initialized w:1 v:3 player:6 -[2023-09-12 19:27:42,253][47627] Initialized w:1 v:3 player:7 -[2023-09-12 19:27:42,255][47627] Initialized w:1 v:3 player:3 -[2023-09-12 19:27:42,255][47629] Initializing env for player 2, init_info: {'port': 40502}... -[2023-09-12 19:27:42,256][47627] Initialized w:1 v:3 player:5 -[2023-09-12 19:27:42,257][47627] 8 agent workers initialized for env 1! -[2023-09-12 19:27:42,303][47629] Initializing env for player 3, init_info: {'port': 40502}... -[2023-09-12 19:27:42,317][47627] Decorrelating experience for 96 frames... -[2023-09-12 19:27:42,331][47664] Initialized w:7 v:3 player:5 -[2023-09-12 19:27:42,331][47664] Initialized w:7 v:3 player:4 -[2023-09-12 19:27:42,332][47664] Initialized w:7 v:3 player:2 -[2023-09-12 19:27:42,334][47664] Initialized w:7 v:3 player:1 -[2023-09-12 19:27:42,335][47628] Initialized w:3 v:3 player:1 -[2023-09-12 19:27:42,334][47664] Initialized w:7 v:3 player:6 -[2023-09-12 19:27:42,335][47664] Initialized w:7 v:3 player:0 -[2023-09-12 19:27:42,335][47664] Initialized w:7 v:3 player:3 -[2023-09-12 19:27:42,335][47664] Initialized w:7 v:3 player:7 -[2023-09-12 19:27:42,337][47628] Initialized w:3 v:3 player:2 -[2023-09-12 19:27:42,338][47664] 8 agent workers initialized for env 7! -[2023-09-12 19:27:42,343][47628] Initialized w:3 v:3 player:0 -[2023-09-12 19:27:42,343][47628] Initialized w:3 v:3 player:7 -[2023-09-12 19:27:42,345][47628] Initialized w:3 v:3 player:6 -[2023-09-12 19:27:42,345][47628] Initialized w:3 v:3 player:3 -[2023-09-12 19:27:42,346][47628] Initialized w:3 v:3 player:5 -[2023-09-12 19:27:42,347][47662] Initializing env for player 0, init_info: {'port': 40702}... -[2023-09-12 19:27:42,361][47629] Initializing env for player 4, init_info: {'port': 40502}... -[2023-09-12 19:27:42,376][47664] Decorrelating experience for 96 frames... -[2023-09-12 19:27:42,384][47662] Using port 40702 on host... -[2023-09-12 19:27:42,397][47662] Initializing env for player 1, init_info: {'port': 40702}... -[2023-09-12 19:27:42,411][47629] Initializing env for player 5, init_info: {'port': 40502}... -[2023-09-12 19:27:42,451][47662] Initializing env for player 2, init_info: {'port': 40702}... -[2023-09-12 19:27:42,475][47629] Initializing env for player 6, init_info: {'port': 40502}... -[2023-09-12 19:27:42,500][47662] Initializing env for player 3, init_info: {'port': 40702}... -[2023-09-12 19:27:42,531][47629] Initializing env for player 7, init_info: {'port': 40502}... -[2023-09-12 19:27:42,550][47662] Initializing env for player 4, init_info: {'port': 40702}... -[2023-09-12 19:27:42,603][47662] Initializing env for player 5, init_info: {'port': 40702}... -[2023-09-12 19:27:42,659][47662] Initializing env for player 6, init_info: {'port': 40702}... -[2023-09-12 19:27:42,711][47662] Initializing env for player 7, init_info: {'port': 40702}... -[2023-09-12 19:27:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:27:43,214][47663] Initialized w:6 v:3 player:6 -[2023-09-12 19:27:43,215][47663] Initialized w:6 v:3 player:4 -[2023-09-12 19:27:43,216][47663] Initialized w:6 v:3 player:3 -[2023-09-12 19:27:43,216][47663] Initialized w:6 v:3 player:0 -[2023-09-12 19:27:43,216][47663] Initialized w:6 v:3 player:7 -[2023-09-12 19:27:43,219][47663] Initialized w:6 v:3 player:5 -[2023-09-12 19:27:43,219][47663] Initialized w:6 v:3 player:2 -[2023-09-12 19:27:43,334][47628] Initialized w:3 v:3 player:4 -[2023-09-12 19:27:43,335][47628] 8 agent workers initialized for env 3! -[2023-09-12 19:27:43,399][47628] Decorrelating experience for 96 frames... -[2023-09-12 19:27:43,465][47630] Initialized w:5 v:3 player:6 -[2023-09-12 19:27:43,467][47630] Initialized w:5 v:3 player:4 -[2023-09-12 19:27:43,467][47630] Initialized w:5 v:3 player:5 -[2023-09-12 19:27:43,467][47630] Initialized w:5 v:3 player:1 -[2023-09-12 19:27:43,467][47630] Initialized w:5 v:3 player:2 -[2023-09-12 19:27:43,467][47630] Initialized w:5 v:3 player:7 -[2023-09-12 19:27:43,467][47630] Initialized w:5 v:3 player:3 -[2023-09-12 19:27:43,467][47630] Initialized w:5 v:3 player:0 -[2023-09-12 19:27:43,470][47630] 8 agent workers initialized for env 5! -[2023-09-12 19:27:43,521][47630] Decorrelating experience for 96 frames... -[2023-09-12 19:27:43,768][47629] Initialized w:2 v:2 player:5 -[2023-09-12 19:27:43,768][47629] Initialized w:2 v:2 player:0 -[2023-09-12 19:27:43,769][47629] Initialized w:2 v:2 player:4 -[2023-09-12 19:27:43,769][47629] Initialized w:2 v:2 player:3 -[2023-09-12 19:27:43,770][47629] Initialized w:2 v:2 player:1 -[2023-09-12 19:27:43,770][47629] Initialized w:2 v:2 player:7 -[2023-09-12 19:27:43,771][47629] Initialized w:2 v:2 player:6 -[2023-09-12 19:27:43,771][47629] Initialized w:2 v:2 player:2 -[2023-09-12 19:27:43,773][47629] 8 agent workers initialized for env 2! -[2023-09-12 19:27:43,820][47629] Decorrelating experience for 64 frames... -[2023-09-12 19:27:44,129][47662] Initialized w:4 v:2 player:1 -[2023-09-12 19:27:44,131][47662] Initialized w:4 v:2 player:7 -[2023-09-12 19:27:44,131][47662] Initialized w:4 v:2 player:4 -[2023-09-12 19:27:44,132][47662] Initialized w:4 v:2 player:6 -[2023-09-12 19:27:44,132][47662] Initialized w:4 v:2 player:5 -[2023-09-12 19:27:44,133][47662] Initialized w:4 v:2 player:2 -[2023-09-12 19:27:44,133][47662] Initialized w:4 v:2 player:0 -[2023-09-12 19:27:44,133][47662] Initialized w:4 v:2 player:3 -[2023-09-12 19:27:44,135][47662] 8 agent workers initialized for env 4! -[2023-09-12 19:27:44,180][47662] Decorrelating experience for 64 frames... -[2023-09-12 19:27:44,590][47629] Port 40503 is available -[2023-09-12 19:27:44,590][47629] Using port 40503 -[2023-09-12 19:27:44,591][47629] Initializing env for player 0, init_info: {'port': 40503}... -[2023-09-12 19:27:44,636][47629] Using port 40503 on host... -[2023-09-12 19:27:44,643][47629] Initializing env for player 1, init_info: {'port': 40503}... -[2023-09-12 19:27:44,719][47629] Initializing env for player 2, init_info: {'port': 40503}... -[2023-09-12 19:27:44,775][47629] Initializing env for player 3, init_info: {'port': 40503}... -[2023-09-12 19:27:44,839][47629] Initializing env for player 4, init_info: {'port': 40503}... -[2023-09-12 19:27:44,892][47629] Initializing env for player 5, init_info: {'port': 40503}... -[2023-09-12 19:27:44,959][47629] Initializing env for player 6, init_info: {'port': 40503}... -[2023-09-12 19:27:45,011][47629] Initializing env for player 7, init_info: {'port': 40503}... -[2023-09-12 19:27:45,147][47662] Port 40703 is available -[2023-09-12 19:27:45,148][47662] Using port 40703 -[2023-09-12 19:27:45,148][47662] Initializing env for player 0, init_info: {'port': 40703}... -[2023-09-12 19:27:45,186][47662] Using port 40703 on host... -[2023-09-12 19:27:45,199][47662] Initializing env for player 1, init_info: {'port': 40703}... -[2023-09-12 19:27:45,265][47662] Initializing env for player 2, init_info: {'port': 40703}... -[2023-09-12 19:27:45,315][47662] Initializing env for player 3, init_info: {'port': 40703}... -[2023-09-12 19:27:45,371][47662] Initializing env for player 4, init_info: {'port': 40703}... -[2023-09-12 19:27:45,424][47662] Initializing env for player 5, init_info: {'port': 40703}... -[2023-09-12 19:27:45,478][47662] Initializing env for player 6, init_info: {'port': 40703}... -[2023-09-12 19:27:45,535][47662] Initializing env for player 7, init_info: {'port': 40703}... -[2023-09-12 19:27:46,226][47474] Signal inference workers to stop experience collection... -[2023-09-12 19:27:46,236][47594] InferenceWorker_p0-w0: stopping experience collection -[2023-09-12 19:27:46,558][47629] Initialized w:2 v:3 player:4 -[2023-09-12 19:27:46,560][47629] Initialized w:2 v:3 player:0 -[2023-09-12 19:27:46,561][47629] Initialized w:2 v:3 player:1 -[2023-09-12 19:27:46,561][47629] Initialized w:2 v:3 player:2 -[2023-09-12 19:27:46,561][47629] Initialized w:2 v:3 player:6 -[2023-09-12 19:27:46,562][47629] Initialized w:2 v:3 player:3 -[2023-09-12 19:27:46,562][47629] Initialized w:2 v:3 player:7 -[2023-09-12 19:27:46,562][47629] Initialized w:2 v:3 player:5 -[2023-09-12 19:27:46,564][47629] 8 agent workers initialized for env 2! -[2023-09-12 19:27:46,612][47629] Decorrelating experience for 96 frames... -[2023-09-12 19:27:47,035][47662] Initialized w:4 v:3 player:5 -[2023-09-12 19:27:47,038][47662] Initialized w:4 v:3 player:7 -[2023-09-12 19:27:47,039][47662] Initialized w:4 v:3 player:3 -[2023-09-12 19:27:47,039][47662] Initialized w:4 v:3 player:0 -[2023-09-12 19:27:47,039][47662] Initialized w:4 v:3 player:2 -[2023-09-12 19:27:47,039][47662] Initialized w:4 v:3 player:4 -[2023-09-12 19:27:47,039][47662] Initialized w:4 v:3 player:6 -[2023-09-12 19:27:47,040][47662] Initialized w:4 v:3 player:1 -[2023-09-12 19:27:47,042][47662] 8 agent workers initialized for env 4! -[2023-09-12 19:27:47,045][47474] EvtLoop [learner_proc0_evt_loop, process=learner_proc0] unhandled exception in slot='on_new_training_batch' connected to emitter=Emitter(object_id='Batcher_0', signal_name='training_batches_available'), args=(0,) -Traceback (most recent call last): - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py", line 355, in _process_signal - slot_callable(*args) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner_worker.py", line 150, in on_new_training_batch - stats = self.learner.train(self.batcher.training_batches[batch_idx]) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 1046, in train - train_stats = self._train(buff, self.cfg.batch_size, experience_size, num_invalids) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 731, in _train - ) = self._calculate_losses(mb, num_invalids) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 649, in _calculate_losses - exploration_loss = self.exploration_loss_func(action_distribution, valids, num_invalids) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 477, in _symmetric_kl_exploration_loss - kl_prior = action_distribution.symmetric_kl_with_uniform_prior() - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py", line 247, in symmetric_kl_with_uniform_prior - sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions] - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py", line 247, in - sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions] -AttributeError: 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior' -[2023-09-12 19:27:47,046][47474] Unhandled exception 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior' in evt loop learner_proc0_evt_loop -[2023-09-12 19:27:47,096][47662] Decorrelating experience for 96 frames... -[2023-09-12 19:27:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 189.9. Samples: 2848. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:27:48,301][45761] Heartbeat connected on Batcher_0 -[2023-09-12 19:27:48,310][45761] Heartbeat connected on InferenceWorker_p0-w0 -[2023-09-12 19:27:48,318][45761] Heartbeat connected on RolloutWorker_w0 -[2023-09-12 19:27:48,322][45761] Heartbeat connected on RolloutWorker_w1 -[2023-09-12 19:27:48,327][45761] Heartbeat connected on RolloutWorker_w2 -[2023-09-12 19:27:48,332][45761] Heartbeat connected on RolloutWorker_w3 -[2023-09-12 19:27:48,336][45761] Heartbeat connected on RolloutWorker_w4 -[2023-09-12 19:27:48,341][45761] Heartbeat connected on RolloutWorker_w5 -[2023-09-12 19:27:48,350][45761] Heartbeat connected on RolloutWorker_w7 -[2023-09-12 19:27:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 252.8. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:27:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 202.2. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:28:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 168.5. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:28:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 144.5. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:28:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 126.4. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:28:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 112.4. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:28:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 112.4. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:28:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 112.4. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:28:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 49.1. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:28:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:28:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:28:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:28:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:28:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:29:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:29:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:29:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:29:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:29:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:29:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:29:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:29:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:29:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:29:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:29:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:29:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:30:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:30:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:30:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:30:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:30:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:30:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:30:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:30:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:30:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:30:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:30:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:30:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:31:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:31:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:31:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:31:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:31:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:31:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:31:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:31:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:31:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:31:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:31:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:31:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:32:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:32:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:32:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:32:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:32:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:32:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:32:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:32:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:32:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:32:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:32:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:32:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:33:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:33:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:33:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:33:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:33:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:33:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:33:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:33:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:33:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:33:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:33:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:33:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:34:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:34:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:34:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:34:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:34:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:34:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:34:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:34:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:34:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:34:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:34:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:34:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:35:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:35:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:35:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:35:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:35:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:35:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:35:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:35:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:35:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:35:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:35:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:35:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:36:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:36:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:36:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:36:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:36:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:36:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:36:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:36:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:36:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:36:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:36:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:36:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:37:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:37:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:37:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:37:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:37:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:37:23,055][45761] Components not started: LearnerWorker_p0, RolloutWorker_w6, wait_time=600.0 seconds -[2023-09-12 19:37:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:37:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:37:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:37:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:37:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:37:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:37:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:38:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:38:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:38:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:38:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:38:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:38:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:38:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:38:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:38:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:38:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:38:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:38:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:39:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:39:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:39:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:39:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:39:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:39:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:39:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:39:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:39:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:39:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:39:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:39:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:40:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:40:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:40:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:40:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:40:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:40:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:40:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:40:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:40:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:40:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:40:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:40:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:41:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:41:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:41:13,050][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:41:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:41:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:41:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:41:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:41:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:41:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:41:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:41:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:41:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:42:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:42:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:42:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:42:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:42:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:42:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:42:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:42:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:42:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:42:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:42:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:42:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:43:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:43:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:43:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:43:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:43:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:43:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:43:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:43:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:43:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:43:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:43:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:43:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:44:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:44:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:44:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:44:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:44:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:44:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:44:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:44:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:44:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:44:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:44:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:44:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:45:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:45:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:45:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:45:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:45:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:45:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:45:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:45:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:45:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:45:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:45:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:45:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:46:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:46:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:46:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:46:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:46:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:46:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:46:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:46:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:46:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:46:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:46:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:46:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:47:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:47:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:47:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:47:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:47:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:47:23,055][45761] Components not started: LearnerWorker_p0, RolloutWorker_w6, wait_time=1200.0 seconds -[2023-09-12 19:47:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:47:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:47:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:47:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:47:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:47:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:47:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:48:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:48:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:48:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:48:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:48:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:48:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:48:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:48:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:48:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:48:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:48:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:48:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:49:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:49:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:49:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:49:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:49:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:49:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:49:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:49:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:49:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:49:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:49:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:49:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:50:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:50:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:50:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:50:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:50:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:50:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:50:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:50:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:50:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:50:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:50:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:50:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:51:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:51:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:51:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:51:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:51:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:51:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:51:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:51:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:51:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:51:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:51:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:51:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:52:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:52:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:52:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:52:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:52:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:52:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:52:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:52:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:52:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:52:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:52:53,050][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:52:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:53:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:53:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:53:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:53:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:53:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:53:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:53:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:53:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:53:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:53:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:53:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:53:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:54:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:54:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:54:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:54:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:54:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:54:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:54:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:54:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:54:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:54:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:54:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:54:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:55:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:55:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:55:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:55:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:55:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:55:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:55:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:55:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:55:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:55:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:55:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:55:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:56:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:56:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:56:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:56:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:56:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:56:28,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:56:33,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:56:38,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:56:43,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:56:48,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:56:53,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:56:58,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:57:03,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:57:08,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:57:13,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:57:18,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:57:23,049][45761] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5056. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 19:57:23,054][45761] Components not started: LearnerWorker_p0, RolloutWorker_w6, wait_time=1800.0 seconds -[2023-09-12 19:57:23,057][45761] Components take too long to start: LearnerWorker_p0, RolloutWorker_w6. Aborting the experiment! - - - -[2023-09-12 19:57:23,059][47474] Stopping Batcher_0... -[2023-09-12 19:57:23,059][47474] Loop batcher_evt_loop terminating... -[2023-09-12 19:57:23,059][45761] Component Batcher_0 stopped! -[2023-09-12 19:57:23,062][45761] Waiting for ['LearnerWorker_p0', 'InferenceWorker_p0-w0', 'RolloutWorker_w0', 'RolloutWorker_w1', 'RolloutWorker_w2', 'RolloutWorker_w3', 'RolloutWorker_w4', 'RolloutWorker_w5', 'RolloutWorker_w6', 'RolloutWorker_w7'] to stop... -[2023-09-12 19:57:23,073][47594] Weights refcount: 2 0 -[2023-09-12 19:57:23,074][47594] Stopping InferenceWorker_p0-w0... -[2023-09-12 19:57:23,074][47594] Loop inference_proc0-0_evt_loop terminating... -[2023-09-12 19:57:23,074][45761] Component InferenceWorker_p0-w0 stopped! -[2023-09-12 19:57:23,076][45761] Waiting for ['LearnerWorker_p0', 'RolloutWorker_w0', 'RolloutWorker_w1', 'RolloutWorker_w2', 'RolloutWorker_w3', 'RolloutWorker_w4', 'RolloutWorker_w5', 'RolloutWorker_w6', 'RolloutWorker_w7'] to stop... -[2023-09-12 19:57:26,275][47629] Stopping RolloutWorker_w2... -[2023-09-12 19:57:26,275][47627] Stopping RolloutWorker_w1... -[2023-09-12 19:57:26,275][47629] Loop rollout_proc2_evt_loop terminating... -[2023-09-12 19:57:26,275][47593] Stopping RolloutWorker_w0... -[2023-09-12 19:57:26,276][47627] Loop rollout_proc1_evt_loop terminating... -[2023-09-12 19:57:26,276][47662] Stopping RolloutWorker_w4... -[2023-09-12 19:57:26,276][47593] Loop rollout_proc0_evt_loop terminating... -[2023-09-12 19:57:26,276][47630] Stopping RolloutWorker_w5... -[2023-09-12 19:57:26,276][47662] Loop rollout_proc4_evt_loop terminating... -[2023-09-12 19:57:26,276][47628] Stopping RolloutWorker_w3... -[2023-09-12 19:57:26,277][47630] Loop rollout_proc5_evt_loop terminating... -[2023-09-12 19:57:26,277][47628] Loop rollout_proc3_evt_loop terminating... -[2023-09-12 19:57:26,277][47664] Stopping RolloutWorker_w7... -[2023-09-12 19:57:26,276][45761] Component LearnerWorker_p0 process died already! Don't wait for it. -[2023-09-12 19:57:26,278][47664] Loop rollout_proc7_evt_loop terminating... -[2023-09-12 19:57:26,278][45761] Component RolloutWorker_w2 stopped! -[2023-09-12 19:57:26,279][45761] Waiting for ['RolloutWorker_w0', 'RolloutWorker_w1', 'RolloutWorker_w3', 'RolloutWorker_w4', 'RolloutWorker_w5', 'RolloutWorker_w6', 'RolloutWorker_w7'] to stop... -[2023-09-12 19:57:26,281][45761] Component RolloutWorker_w1 stopped! -[2023-09-12 19:57:26,283][45761] Waiting for ['RolloutWorker_w0', 'RolloutWorker_w3', 'RolloutWorker_w4', 'RolloutWorker_w5', 'RolloutWorker_w6', 'RolloutWorker_w7'] to stop... -[2023-09-12 19:57:26,285][45761] Component RolloutWorker_w0 stopped! -[2023-09-12 19:57:26,286][45761] Waiting for ['RolloutWorker_w3', 'RolloutWorker_w4', 'RolloutWorker_w5', 'RolloutWorker_w6', 'RolloutWorker_w7'] to stop... -[2023-09-12 19:57:26,287][45761] Component RolloutWorker_w4 stopped! -[2023-09-12 19:57:26,289][45761] Waiting for ['RolloutWorker_w3', 'RolloutWorker_w5', 'RolloutWorker_w6', 'RolloutWorker_w7'] to stop... -[2023-09-12 19:57:26,290][45761] Component RolloutWorker_w5 stopped! -[2023-09-12 19:57:26,291][45761] Waiting for ['RolloutWorker_w3', 'RolloutWorker_w6', 'RolloutWorker_w7'] to stop... -[2023-09-12 19:57:26,292][45761] Component RolloutWorker_w3 stopped! -[2023-09-12 19:57:26,293][45761] Waiting for ['RolloutWorker_w6', 'RolloutWorker_w7'] to stop... -[2023-09-12 19:57:26,295][45761] Component RolloutWorker_w7 stopped! -[2023-09-12 19:57:26,296][45761] Waiting for ['RolloutWorker_w6'] to stop... -[2023-09-12 20:58:13,927][47663] VizDoom game.init() threw an exception SignalException('Signal SIGINT received. ViZDoom instance has been closed.'). Terminate process... -[2023-09-12 20:58:13,931][47663] Failed with error RuntimeError('Critical error: worker stuck on initialization. Abort! '), trying again -[2023-09-12 20:58:13,946][45761] Keyboard interrupt detected in the event loop EvtLoop [Runner_EvtLoop, process=main process 45761], exiting... -[2023-09-12 20:58:13,948][45761] Runner profile tree view: -main_loop: 5445.5967 -[2023-09-12 20:58:13,949][45761] Collected {0: 0}, FPS: 0.0 -[2023-09-12 20:58:13,989][45761] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json -[2023-09-12 20:58:13,990][45761] Overriding arg 'num_workers' with value 1 passed from command line -[2023-09-12 20:58:13,991][45761] Adding new argument 'no_render'=True that is not in the saved config file! -[2023-09-12 20:58:13,992][45761] Adding new argument 'save_video'=True that is not in the saved config file! -[2023-09-12 20:58:13,993][45761] Adding new argument 'video_frames'=1000000000.0 that is not in the saved config file! -[2023-09-12 20:58:13,994][45761] Adding new argument 'video_name'=None that is not in the saved config file! -[2023-09-12 20:58:13,996][45761] Adding new argument 'max_num_frames'=1000000000.0 that is not in the saved config file! -[2023-09-12 20:58:13,997][45761] Adding new argument 'max_num_episodes'=10 that is not in the saved config file! -[2023-09-12 20:58:13,998][45761] Adding new argument 'push_to_hub'=False that is not in the saved config file! -[2023-09-12 20:58:13,999][45761] Adding new argument 'hf_repository'=None that is not in the saved config file! -[2023-09-12 20:58:14,000][45761] Adding new argument 'policy_index'=0 that is not in the saved config file! -[2023-09-12 20:58:14,001][45761] Adding new argument 'eval_deterministic'=False that is not in the saved config file! -[2023-09-12 20:58:14,002][45761] Adding new argument 'train_script'=None that is not in the saved config file! -[2023-09-12 20:58:14,003][45761] Adding new argument 'enjoy_script'=None that is not in the saved config file! -[2023-09-12 20:58:14,003][45761] Using frameskip 1 and render_action_repeat=4 for evaluation -[2023-09-12 20:58:14,006][45761] Multi agent env, num agents: 8 -[2023-09-12 20:58:14,035][45761] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 20:58:14,041][45761] RunningMeanStd input shape: (23,) -[2023-09-12 20:58:14,042][45761] RunningMeanStd input shape: (3, 72, 128) -[2023-09-12 20:58:14,044][45761] RunningMeanStd input shape: (1,) -[2023-09-12 20:58:14,057][45761] ConvEncoder: input_channels=3 -[2023-09-12 20:58:14,193][45761] Conv encoder output size: 512 -[2023-09-12 20:58:14,196][45761] Policy head output size: 640 -[2023-09-12 20:58:14,937][47663] Port 40903 is available -[2023-09-12 20:58:14,937][47663] Using port 40903 -[2023-09-12 20:58:14,938][47663] Initializing env for player 0, init_info: {'port': 40903}... -[2023-09-12 20:58:14,972][47663] Using port 40903 on host... -[2023-09-12 20:58:14,989][47663] Initializing env for player 1, init_info: {'port': 40903}... -[2023-09-12 20:58:15,039][47663] Initializing env for player 2, init_info: {'port': 40903}... -[2023-09-12 20:58:15,089][47663] Initializing env for player 3, init_info: {'port': 40903}... -[2023-09-12 20:58:15,151][47663] Initializing env for player 4, init_info: {'port': 40903}... -[2023-09-12 20:58:15,203][47663] Initializing env for player 5, init_info: {'port': 40903}... -[2023-09-12 20:58:15,259][47663] Initializing env for player 6, init_info: {'port': 40903}... -[2023-09-12 20:58:15,307][47663] Initializing env for player 7, init_info: {'port': 40903}... -[2023-09-12 20:58:15,335][45761] No checkpoints found -[2023-09-12 20:58:16,238][45761] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json -[2023-09-12 20:58:16,239][45761] Overriding arg 'num_workers' with value 1 passed from command line -[2023-09-12 20:58:16,241][45761] Adding new argument 'no_render'=True that is not in the saved config file! -[2023-09-12 20:58:16,242][45761] Adding new argument 'save_video'=True that is not in the saved config file! -[2023-09-12 20:58:16,243][45761] Adding new argument 'video_frames'=1000000000.0 that is not in the saved config file! -[2023-09-12 20:58:16,244][45761] Adding new argument 'video_name'=None that is not in the saved config file! -[2023-09-12 20:58:16,245][45761] Adding new argument 'max_num_frames'=100000 that is not in the saved config file! -[2023-09-12 20:58:16,247][45761] Adding new argument 'max_num_episodes'=10 that is not in the saved config file! -[2023-09-12 20:58:16,248][45761] Adding new argument 'push_to_hub'=True that is not in the saved config file! -[2023-09-12 20:58:16,249][45761] Adding new argument 'hf_repository'='MattStammers/vizdoom_fight' that is not in the saved config file! -[2023-09-12 20:58:16,250][45761] Adding new argument 'policy_index'=0 that is not in the saved config file! -[2023-09-12 20:58:16,250][45761] Adding new argument 'eval_deterministic'=False that is not in the saved config file! -[2023-09-12 20:58:16,251][45761] Adding new argument 'train_script'=None that is not in the saved config file! -[2023-09-12 20:58:16,252][45761] Adding new argument 'enjoy_script'=None that is not in the saved config file! -[2023-09-12 20:58:16,252][45761] Using frameskip 1 and render_action_repeat=4 for evaluation -[2023-09-12 20:58:16,253][45761] Multi agent env, num agents: 8 -[2023-09-12 20:58:16,283][45761] RunningMeanStd input shape: (23,) -[2023-09-12 20:58:16,285][45761] RunningMeanStd input shape: (3, 72, 128) -[2023-09-12 20:58:16,286][45761] RunningMeanStd input shape: (1,) -[2023-09-12 20:58:16,295][45761] ConvEncoder: input_channels=3 -[2023-09-12 20:58:16,342][45761] Conv encoder output size: 512 -[2023-09-12 20:58:16,345][45761] Policy head output size: 640 -[2023-09-12 20:58:16,376][45761] No checkpoints found -[2023-09-12 20:58:16,490][47663] Initialized w:6 v:3 player:6 -[2023-09-12 20:58:16,491][47663] Initialized w:6 v:3 player:0 -[2023-09-12 20:58:16,492][47663] Initialized w:6 v:3 player:2 -[2023-09-12 20:58:16,493][47663] Initialized w:6 v:3 player:3 -[2023-09-12 20:58:16,493][47663] Initialized w:6 v:3 player:7 -[2023-09-12 20:58:16,493][47663] Initialized w:6 v:3 player:4 -[2023-09-12 20:58:16,494][47663] Initialized w:6 v:3 player:5 -[2023-09-12 20:58:16,496][47663] Initialized w:6 v:3 player:1 -[2023-09-12 20:58:16,497][47663] 8 agent workers initialized for env 6! -[2023-09-12 20:58:16,546][47663] Decorrelating experience for 96 frames... -[2023-09-12 20:58:20,712][47663] Stopping RolloutWorker_w6... -[2023-09-12 20:58:20,713][47663] Loop rollout_proc6_evt_loop terminating... -[2023-09-12 20:59:03,126][28625] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json... -[2023-09-12 20:59:04,135][28625] Rollout worker 0 uses device cpu -[2023-09-12 20:59:04,136][28625] Rollout worker 1 uses device cpu -[2023-09-12 20:59:04,138][28625] Rollout worker 2 uses device cpu -[2023-09-12 20:59:04,139][28625] Rollout worker 3 uses device cpu -[2023-09-12 20:59:04,140][28625] Rollout worker 4 uses device cpu -[2023-09-12 20:59:04,142][28625] Rollout worker 5 uses device cpu -[2023-09-12 20:59:04,144][28625] Rollout worker 6 uses device cpu -[2023-09-12 20:59:04,144][28625] Rollout worker 7 uses device cpu -[2023-09-12 20:59:04,357][28625] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 20:59:04,358][28625] InferenceWorker_p0-w0: min num requests: 2 -[2023-09-12 20:59:04,384][28625] Starting all processes... -[2023-09-12 20:59:04,385][28625] Starting process learner_proc0 -[2023-09-12 20:59:06,069][29273] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 20:59:06,070][29273] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 -[2023-09-12 20:59:06,068][28625] Starting all processes... -[2023-09-12 20:59:06,076][28625] Starting process inference_proc0-0 -[2023-09-12 20:59:06,077][28625] Starting process rollout_proc0 -[2023-09-12 20:59:06,078][28625] Starting process rollout_proc1 -[2023-09-12 20:59:06,078][28625] Starting process rollout_proc2 -[2023-09-12 20:59:06,079][28625] Starting process rollout_proc3 -[2023-09-12 20:59:06,080][28625] Starting process rollout_proc4 -[2023-09-12 20:59:06,110][29273] Num visible devices: 1 -[2023-09-12 20:59:06,080][28625] Starting process rollout_proc5 -[2023-09-12 20:59:06,153][29273] Starting seed is not provided -[2023-09-12 20:59:06,153][29273] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 20:59:06,154][29273] Initializing actor-critic model on device cuda:0 -[2023-09-12 20:59:06,154][29273] RunningMeanStd input shape: (23,) -[2023-09-12 20:59:06,154][29273] RunningMeanStd input shape: (3, 72, 128) -[2023-09-12 20:59:06,155][29273] RunningMeanStd input shape: (1,) -[2023-09-12 20:59:06,084][28625] Starting process rollout_proc6 -[2023-09-12 20:59:06,172][29273] ConvEncoder: input_channels=3 -[2023-09-12 20:59:06,086][28625] Starting process rollout_proc7 -[2023-09-12 20:59:06,345][29273] Conv encoder output size: 512 -[2023-09-12 20:59:06,346][29273] Policy head output size: 640 -[2023-09-12 20:59:06,364][29273] Created Actor Critic model with architecture: -[2023-09-12 20:59:06,364][29273] ActorCriticSharedWeights( - (obs_normalizer): ObservationNormalizer( - (running_mean_std): RunningMeanStdDictInPlace( - (running_mean_std): ModuleDict( - (measurements): RunningMeanStdInPlace() - (obs): RunningMeanStdInPlace() - ) - ) - ) - (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) - (encoder): VizdoomEncoder( - (basic_encoder): ConvEncoder( - (enc): RecursiveScriptModule( - original_name=ConvEncoderImpl - (conv_head): RecursiveScriptModule( - original_name=Sequential - (0): RecursiveScriptModule(original_name=Conv2d) - (1): RecursiveScriptModule(original_name=ELU) - (2): RecursiveScriptModule(original_name=Conv2d) - (3): RecursiveScriptModule(original_name=ELU) - (4): RecursiveScriptModule(original_name=Conv2d) - (5): RecursiveScriptModule(original_name=ELU) - ) - (mlp_layers): RecursiveScriptModule( - original_name=Sequential - (0): RecursiveScriptModule(original_name=Linear) - (1): RecursiveScriptModule(original_name=ELU) - ) - ) - ) - (measurements_head): Sequential( - (0): Linear(in_features=23, out_features=128, bias=True) - (1): ELU(alpha=1.0) - (2): Linear(in_features=128, out_features=128, bias=True) - (3): ELU(alpha=1.0) - ) - ) - (core): ModelCoreRNN( - (core): GRU(640, 512) - ) - (decoder): MlpDecoder( - (mlp): Identity() - ) - (critic_linear): Linear(in_features=512, out_features=1, bias=True) - (action_parameterization): ActionParameterizationDefault( - (distribution_linear): Linear(in_features=512, out_features=15, bias=True) - ) -) -[2023-09-12 20:59:07,588][29273] Using optimizer -[2023-09-12 20:59:07,588][29273] No checkpoints found -[2023-09-12 20:59:07,589][29273] Did not load from checkpoint, starting from scratch! -[2023-09-12 20:59:07,589][29273] Initialized policy 0 weights for model version 0 -[2023-09-12 20:59:07,591][29273] LearnerWorker_p0 finished initialization! -[2023-09-12 20:59:07,591][29273] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 20:59:08,052][29485] Worker 1 uses CPU cores [4, 5, 6, 7] -[2023-09-12 20:59:08,091][29486] Worker 2 uses CPU cores [8, 9, 10, 11] -[2023-09-12 20:59:08,165][29520] Worker 4 uses CPU cores [16, 17, 18, 19] -[2023-09-12 20:59:08,224][29452] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 20:59:08,224][29452] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 -[2023-09-12 20:59:08,264][29452] Num visible devices: 1 -[2023-09-12 20:59:08,270][29453] Worker 0 uses CPU cores [0, 1, 2, 3] -[2023-09-12 20:59:08,271][29522] Worker 6 uses CPU cores [24, 25, 26, 27] -[2023-09-12 20:59:08,319][29519] Worker 3 uses CPU cores [12, 13, 14, 15] -[2023-09-12 20:59:08,404][29521] Worker 5 uses CPU cores [20, 21, 22, 23] -[2023-09-12 20:59:08,472][29523] Worker 7 uses CPU cores [28, 29, 30, 31] -[2023-09-12 20:59:08,998][29452] RunningMeanStd input shape: (23,) -[2023-09-12 20:59:08,998][29452] RunningMeanStd input shape: (3, 72, 128) -[2023-09-12 20:59:08,999][29452] RunningMeanStd input shape: (1,) -[2023-09-12 20:59:09,011][29452] ConvEncoder: input_channels=3 -[2023-09-12 20:59:09,118][29452] Conv encoder output size: 512 -[2023-09-12 20:59:09,119][29452] Policy head output size: 640 -[2023-09-12 20:59:09,192][28625] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 0. Throughput: 0: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 20:59:09,482][28625] Inference worker 0-0 is ready! -[2023-09-12 20:59:09,483][28625] All inference workers are ready! Signal rollout workers to start! -[2023-09-12 20:59:09,489][29486] Multi agent env, num agents: 8 -[2023-09-12 20:59:09,490][29523] Multi agent env, num agents: 8 -[2023-09-12 20:59:09,490][29521] Multi agent env, num agents: 8 -[2023-09-12 20:59:09,490][29520] Multi agent env, num agents: 8 -[2023-09-12 20:59:09,490][29522] Multi agent env, num agents: 8 -[2023-09-12 20:59:09,490][29453] Multi agent env, num agents: 8 -[2023-09-12 20:59:09,491][29485] Multi agent env, num agents: 8 -[2023-09-12 20:59:09,491][29519] Multi agent env, num agents: 8 -[2023-09-12 20:59:09,521][29486] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 20:59:09,523][29519] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 20:59:09,524][29522] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 20:59:09,524][29521] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 20:59:09,524][29520] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 20:59:09,524][29523] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 20:59:09,525][29453] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 20:59:09,526][29519] Multi agent env, num agents: 8 -[2023-09-12 20:59:09,526][29486] Multi agent env, num agents: 8 -[2023-09-12 20:59:09,527][29522] Multi agent env, num agents: 8 -[2023-09-12 20:59:09,527][29521] Multi agent env, num agents: 8 -[2023-09-12 20:59:09,527][29520] Multi agent env, num agents: 8 -[2023-09-12 20:59:09,528][29523] Multi agent env, num agents: 8 -[2023-09-12 20:59:09,529][29453] Multi agent env, num agents: 8 -[2023-09-12 20:59:09,538][29485] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 20:59:09,541][29485] Multi agent env, num agents: 8 -[2023-09-12 20:59:09,558][29519] Port 40600 is available -[2023-09-12 20:59:09,558][29519] Using port 40600 -[2023-09-12 20:59:09,559][29519] Initializing env for player 0, init_info: {'port': 40600}... -[2023-09-12 20:59:09,559][29522] Port 40900 is available -[2023-09-12 20:59:09,559][29520] Port 40700 is available -[2023-09-12 20:59:09,560][29520] Using port 40700 -[2023-09-12 20:59:09,560][29522] Using port 40900 -[2023-09-12 20:59:09,560][29521] Port 40800 is available -[2023-09-12 20:59:09,560][29521] Using port 40800 -[2023-09-12 20:59:09,560][29523] Port 41000 is available -[2023-09-12 20:59:09,561][29520] Initializing env for player 0, init_info: {'port': 40700}... -[2023-09-12 20:59:09,561][29523] Using port 41000 -[2023-09-12 20:59:09,561][29522] Initializing env for player 0, init_info: {'port': 40900}... -[2023-09-12 20:59:09,561][29521] Initializing env for player 0, init_info: {'port': 40800}... -[2023-09-12 20:59:09,562][29453] Port 40300 is available -[2023-09-12 20:59:09,562][29453] Using port 40300 -[2023-09-12 20:59:09,562][29486] Port 40500 is available -[2023-09-12 20:59:09,562][29523] Initializing env for player 0, init_info: {'port': 41000}... -[2023-09-12 20:59:09,562][29486] Using port 40500 -[2023-09-12 20:59:09,563][29453] Initializing env for player 0, init_info: {'port': 40300}... -[2023-09-12 20:59:09,564][29486] Initializing env for player 0, init_info: {'port': 40500}... -[2023-09-12 20:59:09,572][29485] Port 40400 is available -[2023-09-12 20:59:09,572][29485] Using port 40400 -[2023-09-12 20:59:09,573][29485] Initializing env for player 0, init_info: {'port': 40400}... -[2023-09-12 20:59:09,588][29519] Using port 40600 on host... -[2023-09-12 20:59:09,590][29520] Using port 40700 on host... -[2023-09-12 20:59:09,591][29522] Using port 40900 on host... -[2023-09-12 20:59:09,593][29523] Using port 41000 on host... -[2023-09-12 20:59:09,594][29486] Using port 40500 on host... -[2023-09-12 20:59:09,596][29521] Using port 40800 on host... -[2023-09-12 20:59:09,598][29453] Using port 40300 on host... -[2023-09-12 20:59:09,601][29485] Using port 40400 on host... -[2023-09-12 20:59:09,610][29519] Initializing env for player 1, init_info: {'port': 40600}... -[2023-09-12 20:59:09,611][29520] Initializing env for player 1, init_info: {'port': 40700}... -[2023-09-12 20:59:09,611][29521] Initializing env for player 1, init_info: {'port': 40800}... -[2023-09-12 20:59:09,612][29522] Initializing env for player 1, init_info: {'port': 40900}... -[2023-09-12 20:59:09,613][29523] Initializing env for player 1, init_info: {'port': 41000}... -[2023-09-12 20:59:09,613][29453] Initializing env for player 1, init_info: {'port': 40300}... -[2023-09-12 20:59:09,614][29486] Initializing env for player 1, init_info: {'port': 40500}... -[2023-09-12 20:59:09,623][29485] Initializing env for player 1, init_info: {'port': 40400}... -[2023-09-12 20:59:09,660][29519] Initializing env for player 2, init_info: {'port': 40600}... -[2023-09-12 20:59:09,662][29521] Initializing env for player 2, init_info: {'port': 40800}... -[2023-09-12 20:59:09,663][29520] Initializing env for player 2, init_info: {'port': 40700}... -[2023-09-12 20:59:09,665][29523] Initializing env for player 2, init_info: {'port': 41000}... -[2023-09-12 20:59:09,667][29453] Initializing env for player 2, init_info: {'port': 40300}... -[2023-09-12 20:59:09,669][29522] Initializing env for player 2, init_info: {'port': 40900}... -[2023-09-12 20:59:09,671][29486] Initializing env for player 2, init_info: {'port': 40500}... -[2023-09-12 20:59:09,674][29485] Initializing env for player 2, init_info: {'port': 40400}... -[2023-09-12 20:59:09,715][29520] Initializing env for player 3, init_info: {'port': 40700}... -[2023-09-12 20:59:09,715][29519] Initializing env for player 3, init_info: {'port': 40600}... -[2023-09-12 20:59:09,717][29453] Initializing env for player 3, init_info: {'port': 40300}... -[2023-09-12 20:59:09,719][29522] Initializing env for player 3, init_info: {'port': 40900}... -[2023-09-12 20:59:09,719][29523] Initializing env for player 3, init_info: {'port': 41000}... -[2023-09-12 20:59:09,721][29486] Initializing env for player 3, init_info: {'port': 40500}... -[2023-09-12 20:59:09,714][29521] Initializing env for player 3, init_info: {'port': 40800}... -[2023-09-12 20:59:09,731][29485] Initializing env for player 3, init_info: {'port': 40400}... -[2023-09-12 20:59:09,764][29519] Initializing env for player 4, init_info: {'port': 40600}... -[2023-09-12 20:59:09,764][29520] Initializing env for player 4, init_info: {'port': 40700}... -[2023-09-12 20:59:09,771][29521] Initializing env for player 4, init_info: {'port': 40800}... -[2023-09-12 20:59:09,771][29522] Initializing env for player 4, init_info: {'port': 40900}... -[2023-09-12 20:59:09,775][29486] Initializing env for player 4, init_info: {'port': 40500}... -[2023-09-12 20:59:09,785][29485] Initializing env for player 4, init_info: {'port': 40400}... -[2023-09-12 20:59:09,785][29523] Initializing env for player 4, init_info: {'port': 41000}... -[2023-09-12 20:59:09,807][29453] Initializing env for player 4, init_info: {'port': 40300}... -[2023-09-12 20:59:09,815][29520] Initializing env for player 5, init_info: {'port': 40700}... -[2023-09-12 20:59:09,816][29519] Initializing env for player 5, init_info: {'port': 40600}... -[2023-09-12 20:59:09,819][29453] Initializing env for player 5, init_info: {'port': 40300}... -[2023-09-12 20:59:09,819][29521] Initializing env for player 5, init_info: {'port': 40800}... -[2023-09-12 20:59:09,822][29522] Initializing env for player 5, init_info: {'port': 40900}... -[2023-09-12 20:59:09,828][29486] Initializing env for player 5, init_info: {'port': 40500}... -[2023-09-12 20:59:09,836][29485] Initializing env for player 5, init_info: {'port': 40400}... -[2023-09-12 20:59:09,838][29523] Initializing env for player 5, init_info: {'port': 41000}... -[2023-09-12 20:59:09,867][29519] Initializing env for player 6, init_info: {'port': 40600}... -[2023-09-12 20:59:09,867][29520] Initializing env for player 6, init_info: {'port': 40700}... -[2023-09-12 20:59:09,871][29453] Initializing env for player 6, init_info: {'port': 40300}... -[2023-09-12 20:59:09,875][29522] Initializing env for player 6, init_info: {'port': 40900}... -[2023-09-12 20:59:09,879][29521] Initializing env for player 6, init_info: {'port': 40800}... -[2023-09-12 20:59:09,886][29486] Initializing env for player 6, init_info: {'port': 40500}... -[2023-09-12 20:59:09,886][29523] Initializing env for player 6, init_info: {'port': 41000}... -[2023-09-12 20:59:09,890][29485] Initializing env for player 6, init_info: {'port': 40400}... -[2023-09-12 20:59:09,917][29520] Initializing env for player 7, init_info: {'port': 40700}... -[2023-09-12 20:59:09,923][29453] Initializing env for player 7, init_info: {'port': 40300}... -[2023-09-12 20:59:09,922][29519] Initializing env for player 7, init_info: {'port': 40600}... -[2023-09-12 20:59:09,924][29521] Initializing env for player 7, init_info: {'port': 40800}... -[2023-09-12 20:59:09,930][29486] Initializing env for player 7, init_info: {'port': 40500}... -[2023-09-12 20:59:09,931][29522] Initializing env for player 7, init_info: {'port': 40900}... -[2023-09-12 20:59:09,943][29523] Initializing env for player 7, init_info: {'port': 41000}... -[2023-09-12 20:59:09,945][29485] Initializing env for player 7, init_info: {'port': 40400}... -[2023-09-12 20:59:11,447][29523] Initialized w:7 v:0 player:1 -[2023-09-12 20:59:11,450][29523] Initialized w:7 v:0 player:6 -[2023-09-12 20:59:11,450][29522] Initialized w:6 v:0 player:3 -[2023-09-12 20:59:11,450][29523] Initialized w:7 v:0 player:4 -[2023-09-12 20:59:11,450][29523] Initialized w:7 v:0 player:2 -[2023-09-12 20:59:11,451][29523] Initialized w:7 v:0 player:7 -[2023-09-12 20:59:11,451][29523] Initialized w:7 v:0 player:0 -[2023-09-12 20:59:11,451][29523] Initialized w:7 v:0 player:3 -[2023-09-12 20:59:11,451][29523] Initialized w:7 v:0 player:5 -[2023-09-12 20:59:11,454][29523] 8 agent workers initialized for env 7! -[2023-09-12 20:59:11,455][29522] Initialized w:6 v:0 player:2 -[2023-09-12 20:59:11,456][29522] Initialized w:6 v:0 player:6 -[2023-09-12 20:59:11,457][29522] Initialized w:6 v:0 player:1 -[2023-09-12 20:59:11,457][29522] Initialized w:6 v:0 player:0 -[2023-09-12 20:59:11,457][29522] Initialized w:6 v:0 player:5 -[2023-09-12 20:59:11,457][29522] Initialized w:6 v:0 player:4 -[2023-09-12 20:59:11,504][29523] Decorrelating experience for 0 frames... -[2023-09-12 20:59:11,506][29523] Port 41001 is available -[2023-09-12 20:59:11,506][29523] Using port 41001 -[2023-09-12 20:59:11,507][29523] Initializing env for player 0, init_info: {'port': 41001}... -[2023-09-12 20:59:11,514][29519] Initialized w:3 v:0 player:7 -[2023-09-12 20:59:11,515][29519] Initialized w:3 v:0 player:0 -[2023-09-12 20:59:11,517][29519] Initialized w:3 v:0 player:1 -[2023-09-12 20:59:11,518][29519] Initialized w:3 v:0 player:4 -[2023-09-12 20:59:11,518][29519] Initialized w:3 v:0 player:2 -[2023-09-12 20:59:11,518][29519] Initialized w:3 v:0 player:6 -[2023-09-12 20:59:11,519][29519] Initialized w:3 v:0 player:3 -[2023-09-12 20:59:11,523][29519] Initialized w:3 v:0 player:5 -[2023-09-12 20:59:11,524][29519] 8 agent workers initialized for env 3! -[2023-09-12 20:59:11,531][29521] Initialized w:5 v:0 player:2 -[2023-09-12 20:59:11,532][29521] Initialized w:5 v:0 player:4 -[2023-09-12 20:59:11,533][29521] Initialized w:5 v:0 player:6 -[2023-09-12 20:59:11,533][29521] Initialized w:5 v:0 player:0 -[2023-09-12 20:59:11,533][29521] Initialized w:5 v:0 player:3 -[2023-09-12 20:59:11,534][29521] Initialized w:5 v:0 player:5 -[2023-09-12 20:59:11,535][29521] Initialized w:5 v:0 player:7 -[2023-09-12 20:59:11,537][29521] Initialized w:5 v:0 player:1 -[2023-09-12 20:59:11,538][29521] 8 agent workers initialized for env 5! -[2023-09-12 20:59:11,547][29523] Using port 41001 on host... -[2023-09-12 20:59:11,557][29523] Initializing env for player 1, init_info: {'port': 41001}... -[2023-09-12 20:59:11,572][29519] Decorrelating experience for 0 frames... -[2023-09-12 20:59:11,568][29520] Initialized w:4 v:0 player:4 -[2023-09-12 20:59:11,574][29519] Port 40601 is available -[2023-09-12 20:59:11,575][29519] Using port 40601 -[2023-09-12 20:59:11,578][29520] Initialized w:4 v:0 player:6 -[2023-09-12 20:59:11,576][29520] Initialized w:4 v:0 player:7 -[2023-09-12 20:59:11,576][29520] Initialized w:4 v:0 player:1 -[2023-09-12 20:59:11,577][29520] Initialized w:4 v:0 player:5 -[2023-09-12 20:59:11,577][29520] Initialized w:4 v:0 player:2 -[2023-09-12 20:59:11,577][29520] Initialized w:4 v:0 player:0 -[2023-09-12 20:59:11,574][29520] Initialized w:4 v:0 player:3 -[2023-09-12 20:59:11,582][29520] 8 agent workers initialized for env 4! -[2023-09-12 20:59:11,585][29485] Initialized w:1 v:0 player:1 -[2023-09-12 20:59:11,587][29485] Initialized w:1 v:0 player:6 -[2023-09-12 20:59:11,588][29485] Initialized w:1 v:0 player:3 -[2023-09-12 20:59:11,588][29485] Initialized w:1 v:0 player:7 -[2023-09-12 20:59:11,588][29485] Initialized w:1 v:0 player:5 -[2023-09-12 20:59:11,589][29485] Initialized w:1 v:0 player:0 -[2023-09-12 20:59:11,589][29485] Initialized w:1 v:0 player:2 -[2023-09-12 20:59:11,590][29485] Initialized w:1 v:0 player:4 -[2023-09-12 20:59:11,591][29485] 8 agent workers initialized for env 1! -[2023-09-12 20:59:11,596][29521] Decorrelating experience for 0 frames... -[2023-09-12 20:59:11,598][29521] Port 40801 is available -[2023-09-12 20:59:11,598][29521] Using port 40801 -[2023-09-12 20:59:11,604][29453] Initialized w:0 v:0 player:7 -[2023-09-12 20:59:11,606][29453] Initialized w:0 v:0 player:0 -[2023-09-12 20:59:11,606][29453] Initialized w:0 v:0 player:3 -[2023-09-12 20:59:11,608][29523] Initializing env for player 2, init_info: {'port': 41001}... -[2023-09-12 20:59:11,606][29453] Initialized w:0 v:0 player:6 -[2023-09-12 20:59:11,606][29453] Initialized w:0 v:0 player:4 -[2023-09-12 20:59:11,606][29453] Initialized w:0 v:0 player:2 -[2023-09-12 20:59:11,606][29453] Initialized w:0 v:0 player:1 -[2023-09-12 20:59:11,607][29453] Initialized w:0 v:0 player:5 -[2023-09-12 20:59:11,611][29453] 8 agent workers initialized for env 0! -[2023-09-12 20:59:11,635][29485] Decorrelating experience for 0 frames... -[2023-09-12 20:59:11,637][29485] Port 40401 is available -[2023-09-12 20:59:11,637][29485] Using port 40401 -[2023-09-12 20:59:11,639][29486] Initialized w:2 v:0 player:0 -[2023-09-12 20:59:11,640][29486] Initialized w:2 v:0 player:1 -[2023-09-12 20:59:11,641][29486] Initialized w:2 v:0 player:4 -[2023-09-12 20:59:11,641][29486] Initialized w:2 v:0 player:3 -[2023-09-12 20:59:11,642][29486] Initialized w:2 v:0 player:6 -[2023-09-12 20:59:11,643][29486] Initialized w:2 v:0 player:2 -[2023-09-12 20:59:11,644][29486] Initialized w:2 v:0 player:7 -[2023-09-12 20:59:11,644][29520] Decorrelating experience for 0 frames... -[2023-09-12 20:59:11,644][29486] Initialized w:2 v:0 player:5 -[2023-09-12 20:59:11,645][29486] 8 agent workers initialized for env 2! -[2023-09-12 20:59:11,646][29520] Port 40701 is available -[2023-09-12 20:59:11,646][29520] Using port 40701 -[2023-09-12 20:59:11,647][29520] Initializing env for player 0, init_info: {'port': 40701}... -[2023-09-12 20:59:11,649][29521] Initializing env for player 0, init_info: {'port': 40801}... -[2023-09-12 20:59:11,654][29453] Decorrelating experience for 0 frames... -[2023-09-12 20:59:11,656][29453] Port 40301 is available -[2023-09-12 20:59:11,656][29453] Using port 40301 -[2023-09-12 20:59:11,656][29453] Initializing env for player 0, init_info: {'port': 40301}... -[2023-09-12 20:59:11,658][29523] Initializing env for player 3, init_info: {'port': 41001}... -[2023-09-12 20:59:11,677][29520] Using port 40701 on host... -[2023-09-12 20:59:11,679][29521] Using port 40801 on host... -[2023-09-12 20:59:11,684][29453] Using port 40301 on host... -[2023-09-12 20:59:11,697][29520] Initializing env for player 1, init_info: {'port': 40701}... -[2023-09-12 20:59:11,699][29521] Initializing env for player 1, init_info: {'port': 40801}... -[2023-09-12 20:59:11,704][29486] Decorrelating experience for 0 frames... -[2023-09-12 20:59:11,706][29486] Port 40501 is available -[2023-09-12 20:59:11,707][29486] Using port 40501 -[2023-09-12 20:59:11,707][29453] Initializing env for player 1, init_info: {'port': 40301}... -[2023-09-12 20:59:11,715][29523] Initializing env for player 4, init_info: {'port': 41001}... -[2023-09-12 20:59:11,748][29520] Initializing env for player 2, init_info: {'port': 40701}... -[2023-09-12 20:59:11,749][29521] Initializing env for player 2, init_info: {'port': 40801}... -[2023-09-12 20:59:11,757][29453] Initializing env for player 2, init_info: {'port': 40301}... -[2023-09-12 20:59:11,767][29523] Initializing env for player 5, init_info: {'port': 41001}... -[2023-09-12 20:59:11,798][29520] Initializing env for player 3, init_info: {'port': 40701}... -[2023-09-12 20:59:11,801][29521] Initializing env for player 3, init_info: {'port': 40801}... -[2023-09-12 20:59:11,807][29453] Initializing env for player 3, init_info: {'port': 40301}... -[2023-09-12 20:59:11,815][29523] Initializing env for player 6, init_info: {'port': 41001}... -[2023-09-12 20:59:11,848][29520] Initializing env for player 4, init_info: {'port': 40701}... -[2023-09-12 20:59:11,853][29521] Initializing env for player 4, init_info: {'port': 40801}... -[2023-09-12 20:59:11,863][29453] Initializing env for player 4, init_info: {'port': 40301}... -[2023-09-12 20:59:11,867][29523] Initializing env for player 7, init_info: {'port': 41001}... -[2023-09-12 20:59:11,899][29520] Initializing env for player 5, init_info: {'port': 40701}... -[2023-09-12 20:59:11,907][29521] Initializing env for player 5, init_info: {'port': 40801}... -[2023-09-12 20:59:11,912][29453] Initializing env for player 5, init_info: {'port': 40301}... -[2023-09-12 20:59:11,963][29521] Initializing env for player 6, init_info: {'port': 40801}... -[2023-09-12 20:59:11,963][29520] Initializing env for player 6, init_info: {'port': 40701}... -[2023-09-12 20:59:11,967][29453] Initializing env for player 6, init_info: {'port': 40301}... -[2023-09-12 20:59:12,011][29520] Initializing env for player 7, init_info: {'port': 40701}... -[2023-09-12 20:59:12,027][29521] Initializing env for player 7, init_info: {'port': 40801}... -[2023-09-12 20:59:12,039][29453] Initializing env for player 7, init_info: {'port': 40301}... -[2023-09-12 20:59:12,448][29522] Initialized w:6 v:0 player:7 -[2023-09-12 20:59:12,450][29522] 8 agent workers initialized for env 6! -[2023-09-12 20:59:12,496][29485] Initializing env for player 0, init_info: {'port': 40401}... -[2023-09-12 20:59:12,524][29522] Decorrelating experience for 0 frames... -[2023-09-12 20:59:12,525][29522] Port 40901 is available -[2023-09-12 20:59:12,525][29522] Using port 40901 -[2023-09-12 20:59:12,526][29522] Initializing env for player 0, init_info: {'port': 40901}... -[2023-09-12 20:59:12,534][29485] Using port 40401 on host... -[2023-09-12 20:59:12,546][29485] Initializing env for player 1, init_info: {'port': 40401}... -[2023-09-12 20:59:12,555][29522] Using port 40901 on host... -[2023-09-12 20:59:12,576][29522] Initializing env for player 1, init_info: {'port': 40901}... -[2023-09-12 20:59:12,597][29485] Initializing env for player 2, init_info: {'port': 40401}... -[2023-09-12 20:59:12,627][29522] Initializing env for player 2, init_info: {'port': 40901}... -[2023-09-12 20:59:12,655][29485] Initializing env for player 3, init_info: {'port': 40401}... -[2023-09-12 20:59:12,677][29522] Initializing env for player 3, init_info: {'port': 40901}... -[2023-09-12 20:59:12,703][29485] Initializing env for player 4, init_info: {'port': 40401}... -[2023-09-12 20:59:12,735][29522] Initializing env for player 4, init_info: {'port': 40901}... -[2023-09-12 20:59:12,759][29485] Initializing env for player 5, init_info: {'port': 40401}... -[2023-09-12 20:59:12,803][29522] Initializing env for player 5, init_info: {'port': 40901}... -[2023-09-12 20:59:12,813][29485] Initializing env for player 6, init_info: {'port': 40401}... -[2023-09-12 20:59:12,852][29522] Initializing env for player 6, init_info: {'port': 40901}... -[2023-09-12 20:59:12,858][29485] Initializing env for player 7, init_info: {'port': 40401}... -[2023-09-12 20:59:12,903][29522] Initializing env for player 7, init_info: {'port': 40901}... -[2023-09-12 20:59:13,236][29523] Initialized w:7 v:1 player:7 -[2023-09-12 20:59:13,238][29523] Initialized w:7 v:1 player:1 -[2023-09-12 20:59:13,238][29523] Initialized w:7 v:1 player:6 -[2023-09-12 20:59:13,238][29523] Initialized w:7 v:1 player:4 -[2023-09-12 20:59:13,238][29523] Initialized w:7 v:1 player:2 -[2023-09-12 20:59:13,239][29523] Initialized w:7 v:1 player:0 -[2023-09-12 20:59:13,239][29523] Initialized w:7 v:1 player:3 -[2023-09-12 20:59:13,239][29523] Initialized w:7 v:1 player:5 -[2023-09-12 20:59:13,242][29523] 8 agent workers initialized for env 7! -[2023-09-12 20:59:13,259][29519] Initializing env for player 0, init_info: {'port': 40601}... -[2023-09-12 20:59:13,288][29523] Decorrelating experience for 32 frames... -[2023-09-12 20:59:13,300][29519] Using port 40601 on host... -[2023-09-12 20:59:13,310][29519] Initializing env for player 1, init_info: {'port': 40601}... -[2023-09-12 20:59:13,352][29521] Initialized w:5 v:1 player:3 -[2023-09-12 20:59:13,352][29521] Initialized w:5 v:1 player:1 -[2023-09-12 20:59:13,352][29521] Initialized w:5 v:1 player:2 -[2023-09-12 20:59:13,353][29521] Initialized w:5 v:1 player:4 -[2023-09-12 20:59:13,353][29521] Initialized w:5 v:1 player:0 -[2023-09-12 20:59:13,353][29521] Initialized w:5 v:1 player:5 -[2023-09-12 20:59:13,353][29521] Initialized w:5 v:1 player:6 -[2023-09-12 20:59:13,353][29521] Initialized w:5 v:1 player:7 -[2023-09-12 20:59:13,356][29521] 8 agent workers initialized for env 5! -[2023-09-12 20:59:13,360][29519] Initializing env for player 2, init_info: {'port': 40601}... -[2023-09-12 20:59:13,395][29486] Initializing env for player 0, init_info: {'port': 40501}... -[2023-09-12 20:59:13,399][29521] Decorrelating experience for 32 frames... -[2023-09-12 20:59:13,410][29519] Initializing env for player 3, init_info: {'port': 40601}... -[2023-09-12 20:59:13,427][29486] Using port 40501 on host... -[2023-09-12 20:59:13,446][29486] Initializing env for player 1, init_info: {'port': 40501}... -[2023-09-12 20:59:13,467][29519] Initializing env for player 4, init_info: {'port': 40601}... -[2023-09-12 20:59:13,495][29453] Initialized w:0 v:1 player:0 -[2023-09-12 20:59:13,498][29453] Initialized w:0 v:1 player:7 -[2023-09-12 20:59:13,499][29453] Initialized w:0 v:1 player:6 -[2023-09-12 20:59:13,499][29486] Initializing env for player 2, init_info: {'port': 40501}... -[2023-09-12 20:59:13,499][29453] Initialized w:0 v:1 player:2 -[2023-09-12 20:59:13,499][29453] Initialized w:0 v:1 player:4 -[2023-09-12 20:59:13,499][29453] Initialized w:0 v:1 player:5 -[2023-09-12 20:59:13,503][29453] Initialized w:0 v:1 player:1 -[2023-09-12 20:59:13,519][29519] Initializing env for player 5, init_info: {'port': 40601}... -[2023-09-12 20:59:13,538][29520] Initialized w:4 v:1 player:5 -[2023-09-12 20:59:13,539][29520] Initialized w:4 v:1 player:4 -[2023-09-12 20:59:13,540][29520] Initialized w:4 v:1 player:2 -[2023-09-12 20:59:13,540][29520] Initialized w:4 v:1 player:1 -[2023-09-12 20:59:13,541][29520] Initialized w:4 v:1 player:6 -[2023-09-12 20:59:13,542][29520] Initialized w:4 v:1 player:7 -[2023-09-12 20:59:13,542][29520] Initialized w:4 v:1 player:0 -[2023-09-12 20:59:13,551][29520] Initialized w:4 v:1 player:3 -[2023-09-12 20:59:13,552][29486] Initializing env for player 3, init_info: {'port': 40501}... -[2023-09-12 20:59:13,553][29520] 8 agent workers initialized for env 4! -[2023-09-12 20:59:13,587][29519] Initializing env for player 6, init_info: {'port': 40601}... -[2023-09-12 20:59:13,591][29520] Decorrelating experience for 32 frames... -[2023-09-12 20:59:13,617][29486] Initializing env for player 4, init_info: {'port': 40501}... -[2023-09-12 20:59:13,637][29519] Initializing env for player 7, init_info: {'port': 40601}... -[2023-09-12 20:59:13,675][29486] Initializing env for player 5, init_info: {'port': 40501}... -[2023-09-12 20:59:13,708][29523] Multi agent env, num agents: 8 -[2023-09-12 20:59:13,727][29486] Initializing env for player 6, init_info: {'port': 40501}... -[2023-09-12 20:59:13,755][29523] Multi agent env, num agents: 8 -[2023-09-12 20:59:13,779][29486] Initializing env for player 7, init_info: {'port': 40501}... -[2023-09-12 20:59:13,802][29523] Port 41002 is available -[2023-09-12 20:59:13,802][29523] Using port 41002 -[2023-09-12 20:59:13,803][29523] Initializing env for player 0, init_info: {'port': 41002}... -[2023-09-12 20:59:13,825][29521] Multi agent env, num agents: 8 -[2023-09-12 20:59:13,848][29523] Using port 41002 on host... -[2023-09-12 20:59:13,857][29521] Multi agent env, num agents: 8 -[2023-09-12 20:59:13,859][29523] Initializing env for player 1, init_info: {'port': 41002}... -[2023-09-12 20:59:13,889][29521] Port 40802 is available -[2023-09-12 20:59:13,889][29521] Using port 40802 -[2023-09-12 20:59:13,890][29521] Initializing env for player 0, init_info: {'port': 40802}... -[2023-09-12 20:59:13,917][29523] Initializing env for player 2, init_info: {'port': 41002}... -[2023-09-12 20:59:13,920][29521] Using port 40802 on host... -[2023-09-12 20:59:13,933][29520] Multi agent env, num agents: 8 -[2023-09-12 20:59:13,941][29521] Initializing env for player 1, init_info: {'port': 40802}... -[2023-09-12 20:59:13,965][29520] Multi agent env, num agents: 8 -[2023-09-12 20:59:13,975][29523] Initializing env for player 3, init_info: {'port': 41002}... -[2023-09-12 20:59:13,995][29521] Initializing env for player 2, init_info: {'port': 40802}... -[2023-09-12 20:59:13,997][29520] Port 40702 is available -[2023-09-12 20:59:13,998][29520] Using port 40702 -[2023-09-12 20:59:13,998][29520] Initializing env for player 0, init_info: {'port': 40702}... -[2023-09-12 20:59:14,031][29520] Using port 40702 on host... -[2023-09-12 20:59:14,039][29523] Initializing env for player 4, init_info: {'port': 41002}... -[2023-09-12 20:59:14,043][29521] Initializing env for player 3, init_info: {'port': 40802}... -[2023-09-12 20:59:14,049][29520] Initializing env for player 1, init_info: {'port': 40702}... -[2023-09-12 20:59:14,091][29523] Initializing env for player 5, init_info: {'port': 41002}... -[2023-09-12 20:59:14,099][29521] Initializing env for player 4, init_info: {'port': 40802}... -[2023-09-12 20:59:14,099][29520] Initializing env for player 2, init_info: {'port': 40702}... -[2023-09-12 20:59:14,131][29485] Initialized w:1 v:1 player:4 -[2023-09-12 20:59:14,132][29485] Initialized w:1 v:1 player:3 -[2023-09-12 20:59:14,134][29485] Initialized w:1 v:1 player:7 -[2023-09-12 20:59:14,134][29485] Initialized w:1 v:1 player:5 -[2023-09-12 20:59:14,135][29485] Initialized w:1 v:1 player:0 -[2023-09-12 20:59:14,135][29485] Initialized w:1 v:1 player:6 -[2023-09-12 20:59:14,136][29485] Initialized w:1 v:1 player:2 -[2023-09-12 20:59:14,136][29485] Initialized w:1 v:1 player:1 -[2023-09-12 20:59:14,138][29485] 8 agent workers initialized for env 1! -[2023-09-12 20:59:14,153][29521] Initializing env for player 5, init_info: {'port': 40802}... -[2023-09-12 20:59:14,156][29520] Initializing env for player 3, init_info: {'port': 40702}... -[2023-09-12 20:59:14,159][29523] Initializing env for player 6, init_info: {'port': 41002}... -[2023-09-12 20:59:14,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 20:59:14,207][29520] Initializing env for player 4, init_info: {'port': 40702}... -[2023-09-12 20:59:14,212][29522] Initialized w:6 v:1 player:0 -[2023-09-12 20:59:14,214][29522] Initialized w:6 v:1 player:2 -[2023-09-12 20:59:14,214][29522] Initialized w:6 v:1 player:1 -[2023-09-12 20:59:14,214][29522] Initialized w:6 v:1 player:6 -[2023-09-12 20:59:14,216][29485] Decorrelating experience for 32 frames... -[2023-09-12 20:59:14,216][29522] Initialized w:6 v:1 player:4 -[2023-09-12 20:59:14,215][29522] Initialized w:6 v:1 player:7 -[2023-09-12 20:59:14,217][29522] Initialized w:6 v:1 player:3 -[2023-09-12 20:59:14,218][29522] Initialized w:6 v:1 player:5 -[2023-09-12 20:59:14,219][29522] 8 agent workers initialized for env 6! -[2023-09-12 20:59:14,222][29521] Initializing env for player 6, init_info: {'port': 40802}... -[2023-09-12 20:59:14,227][29523] Initializing env for player 7, init_info: {'port': 41002}... -[2023-09-12 20:59:14,259][29520] Initializing env for player 5, init_info: {'port': 40702}... -[2023-09-12 20:59:14,310][29520] Initializing env for player 6, init_info: {'port': 40702}... -[2023-09-12 20:59:14,311][29521] Initializing env for player 7, init_info: {'port': 40802}... -[2023-09-12 20:59:14,320][29522] Decorrelating experience for 32 frames... -[2023-09-12 20:59:14,363][29520] Initializing env for player 7, init_info: {'port': 40702}... -[2023-09-12 20:59:14,495][29453] Initialized w:0 v:1 player:3 -[2023-09-12 20:59:14,496][29453] 8 agent workers initialized for env 0! -[2023-09-12 20:59:14,588][29453] Decorrelating experience for 32 frames... -[2023-09-12 20:59:14,920][29522] Multi agent env, num agents: 8 -[2023-09-12 20:59:14,967][29522] Multi agent env, num agents: 8 -[2023-09-12 20:59:15,013][29485] Multi agent env, num agents: 8 -[2023-09-12 20:59:15,014][29522] Port 40902 is available -[2023-09-12 20:59:15,015][29522] Using port 40902 -[2023-09-12 20:59:15,015][29522] Initializing env for player 0, init_info: {'port': 40902}... -[2023-09-12 20:59:15,026][29453] Multi agent env, num agents: 8 -[2023-09-12 20:59:15,044][29485] Multi agent env, num agents: 8 -[2023-09-12 20:59:15,047][29522] Using port 40902 on host... -[2023-09-12 20:59:15,056][29453] Multi agent env, num agents: 8 -[2023-09-12 20:59:15,066][29522] Initializing env for player 1, init_info: {'port': 40902}... -[2023-09-12 20:59:15,076][29485] Port 40402 is available -[2023-09-12 20:59:15,077][29485] Using port 40402 -[2023-09-12 20:59:15,078][29485] Initializing env for player 0, init_info: {'port': 40402}... -[2023-09-12 20:59:15,087][29453] Port 40302 is available -[2023-09-12 20:59:15,087][29453] Using port 40302 -[2023-09-12 20:59:15,088][29453] Initializing env for player 0, init_info: {'port': 40302}... -[2023-09-12 20:59:15,106][29485] Using port 40402 on host... -[2023-09-12 20:59:15,116][29522] Initializing env for player 2, init_info: {'port': 40902}... -[2023-09-12 20:59:15,120][29453] Using port 40302 on host... -[2023-09-12 20:59:15,128][29485] Initializing env for player 1, init_info: {'port': 40402}... -[2023-09-12 20:59:15,139][29453] Initializing env for player 1, init_info: {'port': 40302}... -[2023-09-12 20:59:15,160][29519] Initialized w:3 v:1 player:3 -[2023-09-12 20:59:15,163][29519] Initialized w:3 v:1 player:0 -[2023-09-12 20:59:15,163][29519] Initialized w:3 v:1 player:1 -[2023-09-12 20:59:15,163][29519] Initialized w:3 v:1 player:5 -[2023-09-12 20:59:15,164][29519] Initialized w:3 v:1 player:7 -[2023-09-12 20:59:15,164][29519] Initialized w:3 v:1 player:2 -[2023-09-12 20:59:15,164][29519] Initialized w:3 v:1 player:4 -[2023-09-12 20:59:15,165][29519] Initialized w:3 v:1 player:6 -[2023-09-12 20:59:15,167][29519] 8 agent workers initialized for env 3! -[2023-09-12 20:59:15,174][29522] Initializing env for player 3, init_info: {'port': 40902}... -[2023-09-12 20:59:15,178][29485] Initializing env for player 2, init_info: {'port': 40402}... -[2023-09-12 20:59:15,191][29453] Initializing env for player 2, init_info: {'port': 40302}... -[2023-09-12 20:59:15,221][29519] Decorrelating experience for 32 frames... -[2023-09-12 20:59:15,223][29522] Initializing env for player 4, init_info: {'port': 40902}... -[2023-09-12 20:59:15,237][29485] Initializing env for player 3, init_info: {'port': 40402}... -[2023-09-12 20:59:15,241][29453] Initializing env for player 3, init_info: {'port': 40302}... -[2023-09-12 20:59:15,279][29522] Initializing env for player 5, init_info: {'port': 40902}... -[2023-09-12 20:59:15,292][29453] Initializing env for player 4, init_info: {'port': 40302}... -[2023-09-12 20:59:15,293][29485] Initializing env for player 4, init_info: {'port': 40402}... -[2023-09-12 20:59:15,319][29486] Initialized w:2 v:1 player:1 -[2023-09-12 20:59:15,319][29486] Initialized w:2 v:1 player:7 -[2023-09-12 20:59:15,320][29486] Initialized w:2 v:1 player:6 -[2023-09-12 20:59:15,321][29486] Initialized w:2 v:1 player:4 -[2023-09-12 20:59:15,321][29486] Initialized w:2 v:1 player:2 -[2023-09-12 20:59:15,323][29486] Initialized w:2 v:1 player:5 -[2023-09-12 20:59:15,324][29486] Initialized w:2 v:1 player:0 -[2023-09-12 20:59:15,326][29486] Initialized w:2 v:1 player:3 -[2023-09-12 20:59:15,327][29486] 8 agent workers initialized for env 2! -[2023-09-12 20:59:15,347][29485] Initializing env for player 5, init_info: {'port': 40402}... -[2023-09-12 20:59:15,355][29522] Initializing env for player 6, init_info: {'port': 40902}... -[2023-09-12 20:59:15,357][29453] Initializing env for player 5, init_info: {'port': 40302}... -[2023-09-12 20:59:15,387][29522] Initializing env for player 7, init_info: {'port': 40902}... -[2023-09-12 20:59:15,399][29485] Initializing env for player 6, init_info: {'port': 40402}... -[2023-09-12 20:59:15,402][29486] Decorrelating experience for 32 frames... -[2023-09-12 20:59:15,415][29453] Initializing env for player 6, init_info: {'port': 40302}... -[2023-09-12 20:59:15,463][29485] Initializing env for player 7, init_info: {'port': 40402}... -[2023-09-12 20:59:15,468][29453] Initializing env for player 7, init_info: {'port': 40302}... -[2023-09-12 20:59:15,599][29523] Initialized w:7 v:2 player:5 -[2023-09-12 20:59:15,602][29523] Initialized w:7 v:2 player:2 -[2023-09-12 20:59:15,603][29523] Initialized w:7 v:2 player:0 -[2023-09-12 20:59:15,604][29523] Initialized w:7 v:2 player:1 -[2023-09-12 20:59:15,605][29523] Initialized w:7 v:2 player:7 -[2023-09-12 20:59:15,605][29523] Initialized w:7 v:2 player:4 -[2023-09-12 20:59:15,606][29523] Initialized w:7 v:2 player:3 -[2023-09-12 20:59:15,607][29523] Initialized w:7 v:2 player:6 -[2023-09-12 20:59:15,608][29523] 8 agent workers initialized for env 7! -[2023-09-12 20:59:15,703][29523] Decorrelating experience for 64 frames... -[2023-09-12 20:59:15,790][29520] Initialized w:4 v:2 player:1 -[2023-09-12 20:59:15,793][29520] Initialized w:4 v:2 player:6 -[2023-09-12 20:59:15,794][29520] Initialized w:4 v:2 player:0 -[2023-09-12 20:59:15,795][29520] Initialized w:4 v:2 player:2 -[2023-09-12 20:59:15,796][29520] Initialized w:4 v:2 player:5 -[2023-09-12 20:59:15,797][29520] Initialized w:4 v:2 player:3 -[2023-09-12 20:59:15,804][29520] Initialized w:4 v:2 player:7 -[2023-09-12 20:59:15,804][29520] Initialized w:4 v:2 player:4 -[2023-09-12 20:59:15,805][29520] 8 agent workers initialized for env 4! -[2023-09-12 20:59:15,861][29520] Decorrelating experience for 64 frames... -[2023-09-12 20:59:15,862][29521] Initialized w:5 v:2 player:4 -[2023-09-12 20:59:15,864][29521] Initialized w:5 v:2 player:5 -[2023-09-12 20:59:15,863][29521] Initialized w:5 v:2 player:0 -[2023-09-12 20:59:15,863][29521] Initialized w:5 v:2 player:2 -[2023-09-12 20:59:15,864][29521] Initialized w:5 v:2 player:6 -[2023-09-12 20:59:15,865][29521] Initialized w:5 v:2 player:1 -[2023-09-12 20:59:15,868][29521] Initialized w:5 v:2 player:7 -[2023-09-12 20:59:15,868][29521] Initialized w:5 v:2 player:3 -[2023-09-12 20:59:15,869][29521] 8 agent workers initialized for env 5! -[2023-09-12 20:59:15,929][29521] Decorrelating experience for 64 frames... -[2023-09-12 20:59:16,046][29486] Multi agent env, num agents: 8 -[2023-09-12 20:59:16,050][29519] Multi agent env, num agents: 8 -[2023-09-12 20:59:16,078][29486] Multi agent env, num agents: 8 -[2023-09-12 20:59:16,097][29519] Multi agent env, num agents: 8 -[2023-09-12 20:59:16,109][29486] Port 40502 is available -[2023-09-12 20:59:16,109][29486] Using port 40502 -[2023-09-12 20:59:16,110][29486] Initializing env for player 0, init_info: {'port': 40502}... -[2023-09-12 20:59:16,145][29486] Using port 40502 on host... -[2023-09-12 20:59:16,147][29519] Port 40602 is available -[2023-09-12 20:59:16,147][29519] Using port 40602 -[2023-09-12 20:59:16,148][29519] Initializing env for player 0, init_info: {'port': 40602}... -[2023-09-12 20:59:16,161][29486] Initializing env for player 1, init_info: {'port': 40502}... -[2023-09-12 20:59:16,193][29519] Using port 40602 on host... -[2023-09-12 20:59:16,204][29519] Initializing env for player 1, init_info: {'port': 40602}... -[2023-09-12 20:59:16,212][29486] Initializing env for player 2, init_info: {'port': 40502}... -[2023-09-12 20:59:16,261][29486] Initializing env for player 3, init_info: {'port': 40502}... -[2023-09-12 20:59:16,266][29519] Initializing env for player 2, init_info: {'port': 40602}... -[2023-09-12 20:59:16,316][29519] Initializing env for player 3, init_info: {'port': 40602}... -[2023-09-12 20:59:16,313][29486] Initializing env for player 4, init_info: {'port': 40502}... -[2023-09-12 20:59:16,367][29486] Initializing env for player 5, init_info: {'port': 40502}... -[2023-09-12 20:59:16,381][29519] Initializing env for player 4, init_info: {'port': 40602}... -[2023-09-12 20:59:16,419][29486] Initializing env for player 6, init_info: {'port': 40502}... -[2023-09-12 20:59:16,435][29519] Initializing env for player 5, init_info: {'port': 40602}... -[2023-09-12 20:59:16,467][29486] Initializing env for player 7, init_info: {'port': 40502}... -[2023-09-12 20:59:16,488][29519] Initializing env for player 6, init_info: {'port': 40602}... -[2023-09-12 20:59:16,547][29519] Initializing env for player 7, init_info: {'port': 40602}... -[2023-09-12 20:59:16,570][29520] Port 40703 is available -[2023-09-12 20:59:16,570][29520] Using port 40703 -[2023-09-12 20:59:16,571][29520] Initializing env for player 0, init_info: {'port': 40703}... -[2023-09-12 20:59:16,601][29520] Using port 40703 on host... -[2023-09-12 20:59:16,604][29521] Port 40803 is available -[2023-09-12 20:59:16,605][29521] Using port 40803 -[2023-09-12 20:59:16,605][29521] Initializing env for player 0, init_info: {'port': 40803}... -[2023-09-12 20:59:16,621][29520] Initializing env for player 1, init_info: {'port': 40703}... -[2023-09-12 20:59:16,634][29521] Using port 40803 on host... -[2023-09-12 20:59:16,656][29521] Initializing env for player 1, init_info: {'port': 40803}... -[2023-09-12 20:59:16,672][29520] Initializing env for player 2, init_info: {'port': 40703}... -[2023-09-12 20:59:16,707][29521] Initializing env for player 2, init_info: {'port': 40803}... -[2023-09-12 20:59:16,715][29523] Port 41003 is available -[2023-09-12 20:59:16,715][29523] Using port 41003 -[2023-09-12 20:59:16,715][29523] Initializing env for player 0, init_info: {'port': 41003}... -[2023-09-12 20:59:16,722][29520] Initializing env for player 3, init_info: {'port': 40703}... -[2023-09-12 20:59:16,757][29521] Initializing env for player 3, init_info: {'port': 40803}... -[2023-09-12 20:59:16,761][29523] Using port 41003 on host... -[2023-09-12 20:59:16,775][29523] Initializing env for player 1, init_info: {'port': 41003}... -[2023-09-12 20:59:16,787][29520] Initializing env for player 4, init_info: {'port': 40703}... -[2023-09-12 20:59:16,827][29523] Initializing env for player 2, init_info: {'port': 41003}... -[2023-09-12 20:59:16,828][29521] Initializing env for player 4, init_info: {'port': 40803}... -[2023-09-12 20:59:16,839][29520] Initializing env for player 5, init_info: {'port': 40703}... -[2023-09-12 20:59:16,874][29522] Initialized w:6 v:2 player:3 -[2023-09-12 20:59:16,878][29523] Initializing env for player 3, init_info: {'port': 41003}... -[2023-09-12 20:59:16,884][29521] Initializing env for player 5, init_info: {'port': 40803}... -[2023-09-12 20:59:16,888][29522] Initialized w:6 v:2 player:7 -[2023-09-12 20:59:16,888][29522] Initialized w:6 v:2 player:1 -[2023-09-12 20:59:16,890][29522] Initialized w:6 v:2 player:5 -[2023-09-12 20:59:16,890][29522] Initialized w:6 v:2 player:4 -[2023-09-12 20:59:16,893][29522] Initialized w:6 v:2 player:0 -[2023-09-12 20:59:16,895][29520] Initializing env for player 6, init_info: {'port': 40703}... -[2023-09-12 20:59:16,894][29522] Initialized w:6 v:2 player:2 -[2023-09-12 20:59:16,895][29522] Initialized w:6 v:2 player:6 -[2023-09-12 20:59:16,897][29522] 8 agent workers initialized for env 6! -[2023-09-12 20:59:16,930][29523] Initializing env for player 4, init_info: {'port': 41003}... -[2023-09-12 20:59:16,939][29521] Initializing env for player 6, init_info: {'port': 40803}... -[2023-09-12 20:59:16,983][29523] Initializing env for player 5, init_info: {'port': 41003}... -[2023-09-12 20:59:16,985][29521] Initializing env for player 7, init_info: {'port': 40803}... -[2023-09-12 20:59:16,998][29522] Decorrelating experience for 64 frames... -[2023-09-12 20:59:17,004][29453] Initialized w:0 v:2 player:7 -[2023-09-12 20:59:17,006][29453] Initialized w:0 v:2 player:2 -[2023-09-12 20:59:17,007][29453] Initialized w:0 v:2 player:4 -[2023-09-12 20:59:17,007][29453] Initialized w:0 v:2 player:1 -[2023-09-12 20:59:17,007][29453] Initialized w:0 v:2 player:0 -[2023-09-12 20:59:17,008][29453] Initialized w:0 v:2 player:5 -[2023-09-12 20:59:17,009][29485] Initialized w:1 v:2 player:3 -[2023-09-12 20:59:17,010][29485] Initialized w:1 v:2 player:5 -[2023-09-12 20:59:17,011][29485] Initialized w:1 v:2 player:4 -[2023-09-12 20:59:17,012][29453] Initialized w:0 v:2 player:6 -[2023-09-12 20:59:17,012][29485] Initialized w:1 v:2 player:1 -[2023-09-12 20:59:17,013][29453] Initialized w:0 v:2 player:3 -[2023-09-12 20:59:17,013][29485] Initialized w:1 v:2 player:6 -[2023-09-12 20:59:17,014][29453] 8 agent workers initialized for env 0! -[2023-09-12 20:59:17,014][29485] Initialized w:1 v:2 player:0 -[2023-09-12 20:59:17,019][29485] Initialized w:1 v:2 player:2 -[2023-09-12 20:59:16,962][29520] Initializing env for player 7, init_info: {'port': 40703}... -[2023-09-12 20:59:17,053][29523] Initializing env for player 6, init_info: {'port': 41003}... -[2023-09-12 20:59:17,091][29453] Decorrelating experience for 64 frames... -[2023-09-12 20:59:17,111][29523] Initializing env for player 7, init_info: {'port': 41003}... -[2023-09-12 20:59:17,882][29453] Port 40303 is available -[2023-09-12 20:59:17,883][29453] Using port 40303 -[2023-09-12 20:59:17,887][29486] Initialized w:2 v:2 player:4 -[2023-09-12 20:59:17,890][29486] Initialized w:2 v:2 player:6 -[2023-09-12 20:59:17,890][29486] Initialized w:2 v:2 player:3 -[2023-09-12 20:59:17,890][29486] Initialized w:2 v:2 player:2 -[2023-09-12 20:59:17,891][29486] Initialized w:2 v:2 player:1 -[2023-09-12 20:59:17,891][29486] Initialized w:2 v:2 player:7 -[2023-09-12 20:59:17,891][29486] Initialized w:2 v:2 player:0 -[2023-09-12 20:59:17,891][29486] Initialized w:2 v:2 player:5 -[2023-09-12 20:59:17,894][29486] 8 agent workers initialized for env 2! -[2023-09-12 20:59:17,954][29486] Decorrelating experience for 64 frames... -[2023-09-12 20:59:17,981][29519] Initialized w:3 v:2 player:3 -[2023-09-12 20:59:17,982][29519] Initialized w:3 v:2 player:5 -[2023-09-12 20:59:17,982][29519] Initialized w:3 v:2 player:6 -[2023-09-12 20:59:17,982][29519] Initialized w:3 v:2 player:1 -[2023-09-12 20:59:17,982][29519] Initialized w:3 v:2 player:7 -[2023-09-12 20:59:17,983][29519] Initialized w:3 v:2 player:2 -[2023-09-12 20:59:17,983][29519] Initialized w:3 v:2 player:0 -[2023-09-12 20:59:17,983][29519] Initialized w:3 v:2 player:4 -[2023-09-12 20:59:17,985][29519] 8 agent workers initialized for env 3! -[2023-09-12 20:59:18,007][29485] Initialized w:1 v:2 player:7 -[2023-09-12 20:59:18,008][29485] 8 agent workers initialized for env 1! -[2023-09-12 20:59:18,035][29453] Initializing env for player 0, init_info: {'port': 40303}... -[2023-09-12 20:59:18,040][29519] Decorrelating experience for 64 frames... -[2023-09-12 20:59:18,079][29453] Using port 40303 on host... -[2023-09-12 20:59:18,087][29453] Initializing env for player 1, init_info: {'port': 40303}... -[2023-09-12 20:59:18,134][29485] Decorrelating experience for 64 frames... -[2023-09-12 20:59:18,137][29453] Initializing env for player 2, init_info: {'port': 40303}... -[2023-09-12 20:59:18,191][29522] Port 40903 is available -[2023-09-12 20:59:18,191][29522] Using port 40903 -[2023-09-12 20:59:18,192][29522] Initializing env for player 0, init_info: {'port': 40903}... -[2023-09-12 20:59:18,203][29453] Initializing env for player 3, init_info: {'port': 40303}... -[2023-09-12 20:59:18,232][29522] Using port 40903 on host... -[2023-09-12 20:59:18,246][29522] Initializing env for player 1, init_info: {'port': 40903}... -[2023-09-12 20:59:18,251][29453] Initializing env for player 4, init_info: {'port': 40303}... -[2023-09-12 20:59:18,302][29522] Initializing env for player 2, init_info: {'port': 40903}... -[2023-09-12 20:59:18,323][29453] Initializing env for player 5, init_info: {'port': 40303}... -[2023-09-12 20:59:18,355][29522] Initializing env for player 3, init_info: {'port': 40903}... -[2023-09-12 20:59:18,383][29453] Initializing env for player 6, init_info: {'port': 40303}... -[2023-09-12 20:59:18,410][29522] Initializing env for player 4, init_info: {'port': 40903}... -[2023-09-12 20:59:18,411][29521] Initialized w:5 v:3 player:1 -[2023-09-12 20:59:18,415][29521] Initialized w:5 v:3 player:2 -[2023-09-12 20:59:18,416][29521] Initialized w:5 v:3 player:0 -[2023-09-12 20:59:18,416][29521] Initialized w:5 v:3 player:4 -[2023-09-12 20:59:18,416][29521] Initialized w:5 v:3 player:5 -[2023-09-12 20:59:18,416][29521] Initialized w:5 v:3 player:6 -[2023-09-12 20:59:18,416][29521] Initialized w:5 v:3 player:7 -[2023-09-12 20:59:18,416][29521] Initialized w:5 v:3 player:3 -[2023-09-12 20:59:18,420][29521] 8 agent workers initialized for env 5! -[2023-09-12 20:59:18,435][29453] Initializing env for player 7, init_info: {'port': 40303}... -[2023-09-12 20:59:18,465][29523] Initialized w:7 v:3 player:7 -[2023-09-12 20:59:18,466][29523] Initialized w:7 v:3 player:0 -[2023-09-12 20:59:18,468][29523] Initialized w:7 v:3 player:5 -[2023-09-12 20:59:18,469][29523] Initialized w:7 v:3 player:1 -[2023-09-12 20:59:18,469][29523] Initialized w:7 v:3 player:2 -[2023-09-12 20:59:18,469][29523] Initialized w:7 v:3 player:3 -[2023-09-12 20:59:18,470][29523] Initialized w:7 v:3 player:6 -[2023-09-12 20:59:18,471][29523] Initialized w:7 v:3 player:4 -[2023-09-12 20:59:18,473][29523] 8 agent workers initialized for env 7! -[2023-09-12 20:59:18,479][29522] Initializing env for player 5, init_info: {'port': 40903}... -[2023-09-12 20:59:18,497][29521] Decorrelating experience for 96 frames... -[2023-09-12 20:59:18,522][29520] Initialized w:4 v:3 player:7 -[2023-09-12 20:59:18,524][29520] Initialized w:4 v:3 player:5 -[2023-09-12 20:59:18,526][29520] Initialized w:4 v:3 player:6 -[2023-09-12 20:59:18,526][29520] Initialized w:4 v:3 player:4 -[2023-09-12 20:59:18,527][29520] Initialized w:4 v:3 player:1 -[2023-09-12 20:59:18,528][29523] Decorrelating experience for 96 frames... -[2023-09-12 20:59:18,529][29520] Initialized w:4 v:3 player:0 -[2023-09-12 20:59:18,531][29520] Initialized w:4 v:3 player:3 -[2023-09-12 20:59:18,531][29520] Initialized w:4 v:3 player:2 -[2023-09-12 20:59:18,532][29520] 8 agent workers initialized for env 4! -[2023-09-12 20:59:18,539][29522] Initializing env for player 6, init_info: {'port': 40903}... -[2023-09-12 20:59:18,613][29522] Initializing env for player 7, init_info: {'port': 40903}... -[2023-09-12 20:59:18,618][29520] Decorrelating experience for 96 frames... -[2023-09-12 20:59:18,912][29519] Port 40603 is available -[2023-09-12 20:59:18,912][29519] Using port 40603 -[2023-09-12 20:59:18,913][29519] Initializing env for player 0, init_info: {'port': 40603}... -[2023-09-12 20:59:18,954][29519] Using port 40603 on host... -[2023-09-12 20:59:18,967][29519] Initializing env for player 1, init_info: {'port': 40603}... -[2023-09-12 20:59:18,984][29486] Port 40503 is available -[2023-09-12 20:59:18,984][29486] Using port 40503 -[2023-09-12 20:59:18,984][29486] Initializing env for player 0, init_info: {'port': 40503}... -[2023-09-12 20:59:19,027][29519] Initializing env for player 2, init_info: {'port': 40603}... -[2023-09-12 20:59:19,030][29486] Using port 40503 on host... -[2023-09-12 20:59:19,043][29486] Initializing env for player 1, init_info: {'port': 40503}... -[2023-09-12 20:59:19,075][29519] Initializing env for player 3, init_info: {'port': 40603}... -[2023-09-12 20:59:19,093][29486] Initializing env for player 2, init_info: {'port': 40503}... -[2023-09-12 20:59:19,138][29519] Initializing env for player 4, init_info: {'port': 40603}... -[2023-09-12 20:59:19,142][29485] Port 40403 is available -[2023-09-12 20:59:19,142][29485] Using port 40403 -[2023-09-12 20:59:19,144][29486] Initializing env for player 3, init_info: {'port': 40503}... -[2023-09-12 20:59:19,191][29519] Initializing env for player 5, init_info: {'port': 40603}... -[2023-09-12 20:59:19,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 20:59:19,195][29486] Initializing env for player 4, init_info: {'port': 40503}... -[2023-09-12 20:59:19,243][29519] Initializing env for player 6, init_info: {'port': 40603}... -[2023-09-12 20:59:19,245][29486] Initializing env for player 5, init_info: {'port': 40503}... -[2023-09-12 20:59:19,322][29486] Initializing env for player 6, init_info: {'port': 40503}... -[2023-09-12 20:59:19,327][29519] Initializing env for player 7, init_info: {'port': 40603}... -[2023-09-12 20:59:19,375][29486] Initializing env for player 7, init_info: {'port': 40503}... -[2023-09-12 20:59:19,881][29453] Initialized w:0 v:3 player:4 -[2023-09-12 20:59:19,884][29453] Initialized w:0 v:3 player:5 -[2023-09-12 20:59:19,884][29453] Initialized w:0 v:3 player:2 -[2023-09-12 20:59:19,885][29453] Initialized w:0 v:3 player:6 -[2023-09-12 20:59:19,886][29453] Initialized w:0 v:3 player:0 -[2023-09-12 20:59:19,887][29453] Initialized w:0 v:3 player:1 -[2023-09-12 20:59:19,887][29453] Initialized w:0 v:3 player:3 -[2023-09-12 20:59:19,887][29453] Initialized w:0 v:3 player:7 -[2023-09-12 20:59:19,889][29453] 8 agent workers initialized for env 0! -[2023-09-12 20:59:19,959][29453] Decorrelating experience for 96 frames... -[2023-09-12 20:59:20,042][29522] Initialized w:6 v:3 player:4 -[2023-09-12 20:59:20,043][29522] Initialized w:6 v:3 player:2 -[2023-09-12 20:59:20,043][29522] Initialized w:6 v:3 player:3 -[2023-09-12 20:59:20,044][29522] Initialized w:6 v:3 player:1 -[2023-09-12 20:59:20,045][29522] Initialized w:6 v:3 player:6 -[2023-09-12 20:59:20,045][29522] Initialized w:6 v:3 player:5 -[2023-09-12 20:59:20,045][29522] Initialized w:6 v:3 player:0 -[2023-09-12 20:59:20,045][29522] Initialized w:6 v:3 player:7 -[2023-09-12 20:59:20,047][29522] 8 agent workers initialized for env 6! -[2023-09-12 20:59:20,089][29522] Decorrelating experience for 96 frames... -[2023-09-12 20:59:20,710][29486] Initialized w:2 v:3 player:0 -[2023-09-12 20:59:20,713][29486] Initialized w:2 v:3 player:7 -[2023-09-12 20:59:20,713][29486] Initialized w:2 v:3 player:5 -[2023-09-12 20:59:20,713][29486] Initialized w:2 v:3 player:4 -[2023-09-12 20:59:20,713][29486] Initialized w:2 v:3 player:3 -[2023-09-12 20:59:20,714][29486] Initialized w:2 v:3 player:2 -[2023-09-12 20:59:20,714][29486] Initialized w:2 v:3 player:6 -[2023-09-12 20:59:20,714][29486] Initialized w:2 v:3 player:1 -[2023-09-12 20:59:20,717][29486] 8 agent workers initialized for env 2! -[2023-09-12 20:59:20,720][29519] Initialized w:3 v:3 player:0 -[2023-09-12 20:59:20,721][29519] Initialized w:3 v:3 player:5 -[2023-09-12 20:59:20,721][29519] Initialized w:3 v:3 player:4 -[2023-09-12 20:59:20,721][29519] Initialized w:3 v:3 player:7 -[2023-09-12 20:59:20,721][29519] Initialized w:3 v:3 player:1 -[2023-09-12 20:59:20,721][29519] Initialized w:3 v:3 player:6 -[2023-09-12 20:59:20,721][29519] Initialized w:3 v:3 player:3 -[2023-09-12 20:59:20,721][29519] Initialized w:3 v:3 player:2 -[2023-09-12 20:59:20,726][29519] 8 agent workers initialized for env 3! -[2023-09-12 20:59:20,769][29485] Initializing env for player 0, init_info: {'port': 40403}... -[2023-09-12 20:59:20,777][29519] Decorrelating experience for 96 frames... -[2023-09-12 20:59:20,786][29486] Decorrelating experience for 96 frames... -[2023-09-12 20:59:20,810][29485] Using port 40403 on host... -[2023-09-12 20:59:20,813][29485] Initializing env for player 1, init_info: {'port': 40403}... -[2023-09-12 20:59:20,875][29485] Initializing env for player 2, init_info: {'port': 40403}... -[2023-09-12 20:59:20,935][29485] Initializing env for player 3, init_info: {'port': 40403}... -[2023-09-12 20:59:20,991][29485] Initializing env for player 4, init_info: {'port': 40403}... -[2023-09-12 20:59:21,043][29485] Initializing env for player 5, init_info: {'port': 40403}... -[2023-09-12 20:59:21,118][29485] Initializing env for player 6, init_info: {'port': 40403}... -[2023-09-12 20:59:21,167][29485] Initializing env for player 7, init_info: {'port': 40403}... -[2023-09-12 20:59:22,760][29273] Signal inference workers to stop experience collection... -[2023-09-12 20:59:22,767][29452] InferenceWorker_p0-w0: stopping experience collection -[2023-09-12 20:59:22,814][29485] Initialized w:1 v:3 player:0 -[2023-09-12 20:59:22,816][29485] Initialized w:1 v:3 player:6 -[2023-09-12 20:59:22,816][29485] Initialized w:1 v:3 player:4 -[2023-09-12 20:59:22,816][29485] Initialized w:1 v:3 player:5 -[2023-09-12 20:59:22,817][29485] Initialized w:1 v:3 player:7 -[2023-09-12 20:59:22,817][29485] Initialized w:1 v:3 player:2 -[2023-09-12 20:59:22,817][29485] Initialized w:1 v:3 player:1 -[2023-09-12 20:59:22,817][29485] Initialized w:1 v:3 player:3 -[2023-09-12 20:59:22,819][29485] 8 agent workers initialized for env 1! -[2023-09-12 20:59:22,852][29485] Decorrelating experience for 96 frames... -[2023-09-12 20:59:23,836][29273] EvtLoop [learner_proc0_evt_loop, process=learner_proc0] unhandled exception in slot='on_new_training_batch' connected to emitter=Emitter(object_id='Batcher_0', signal_name='training_batches_available'), args=(0,) -Traceback (most recent call last): - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py", line 355, in _process_signal - slot_callable(*args) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner_worker.py", line 150, in on_new_training_batch - stats = self.learner.train(self.batcher.training_batches[batch_idx]) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 1046, in train - train_stats = self._train(buff, self.cfg.batch_size, experience_size, num_invalids) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 731, in _train - ) = self._calculate_losses(mb, num_invalids) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 649, in _calculate_losses - exploration_loss = self.exploration_loss_func(action_distribution, valids, num_invalids) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 477, in _symmetric_kl_exploration_loss - kl_prior = action_distribution.symmetric_kl_with_uniform_prior() - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py", line 247, in symmetric_kl_with_uniform_prior - sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions] - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py", line 247, in - sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions] -AttributeError: 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior' -[2023-09-12 20:59:23,837][29273] Unhandled exception 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior' in evt loop learner_proc0_evt_loop -[2023-09-12 20:59:24,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 103.5. Samples: 1552. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 20:59:24,351][28625] Heartbeat connected on Batcher_0 -[2023-09-12 20:59:24,357][28625] Heartbeat connected on InferenceWorker_p0-w0 -[2023-09-12 20:59:24,362][28625] Heartbeat connected on RolloutWorker_w0 -[2023-09-12 20:59:24,365][28625] Heartbeat connected on RolloutWorker_w1 -[2023-09-12 20:59:24,368][28625] Heartbeat connected on RolloutWorker_w2 -[2023-09-12 20:59:24,371][28625] Heartbeat connected on RolloutWorker_w3 -[2023-09-12 20:59:24,374][28625] Heartbeat connected on RolloutWorker_w4 -[2023-09-12 20:59:24,377][28625] Heartbeat connected on RolloutWorker_w5 -[2023-09-12 20:59:24,381][28625] Heartbeat connected on RolloutWorker_w6 -[2023-09-12 20:59:24,384][28625] Heartbeat connected on RolloutWorker_w7 -[2023-09-12 20:59:29,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 257.6. Samples: 5152. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 20:59:34,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 206.1. Samples: 5152. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 20:59:39,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 171.7. Samples: 5152. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 20:59:44,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 147.2. Samples: 5152. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 20:59:49,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 128.8. Samples: 5152. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 20:59:54,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 114.5. Samples: 5152. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 20:59:59,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 114.5. Samples: 5152. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:00:04,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 114.5. Samples: 5152. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:00:09,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 80.0. Samples: 5152. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:00:14,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5152. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:00:19,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5152. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:00:24,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5152. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:00:29,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5152. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:00:34,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5152. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:00:39,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5152. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:00:44,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5152. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:00:49,192][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 5152. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:00:52,234][28625] Keyboard interrupt detected in the event loop EvtLoop [Runner_EvtLoop, process=main process 28625], exiting... -[2023-09-12 21:00:52,235][29273] Stopping Batcher_0... -[2023-09-12 21:00:52,236][29273] Loop batcher_evt_loop terminating... -[2023-09-12 21:00:52,235][28625] Runner profile tree view: -main_loop: 107.8515 -[2023-09-12 21:00:52,236][28625] Collected {0: 0}, FPS: 0.0 -[2023-09-12 21:00:52,259][29452] Weights refcount: 2 0 -[2023-09-12 21:00:52,260][29452] Stopping InferenceWorker_p0-w0... -[2023-09-12 21:00:52,260][29452] Loop inference_proc0-0_evt_loop terminating... -[2023-09-12 21:00:52,401][28625] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json -[2023-09-12 21:00:52,402][28625] Overriding arg 'num_workers' with value 1 passed from command line -[2023-09-12 21:00:52,403][28625] Adding new argument 'no_render'=True that is not in the saved config file! -[2023-09-12 21:00:52,404][28625] Adding new argument 'save_video'=True that is not in the saved config file! -[2023-09-12 21:00:52,405][28625] Adding new argument 'video_frames'=1000000000.0 that is not in the saved config file! -[2023-09-12 21:00:52,405][28625] Adding new argument 'video_name'=None that is not in the saved config file! -[2023-09-12 21:00:52,406][28625] Adding new argument 'max_num_frames'=1000000000.0 that is not in the saved config file! -[2023-09-12 21:00:52,407][28625] Adding new argument 'max_num_episodes'=10 that is not in the saved config file! -[2023-09-12 21:00:52,408][28625] Adding new argument 'push_to_hub'=False that is not in the saved config file! -[2023-09-12 21:00:52,408][28625] Adding new argument 'hf_repository'=None that is not in the saved config file! -[2023-09-12 21:00:52,409][28625] Adding new argument 'policy_index'=0 that is not in the saved config file! -[2023-09-12 21:00:52,410][28625] Adding new argument 'eval_deterministic'=False that is not in the saved config file! -[2023-09-12 21:00:52,412][28625] Adding new argument 'train_script'=None that is not in the saved config file! -[2023-09-12 21:00:52,413][28625] Adding new argument 'enjoy_script'=None that is not in the saved config file! -[2023-09-12 21:00:52,413][28625] Using frameskip 1 and render_action_repeat=4 for evaluation -[2023-09-12 21:00:52,416][28625] Multi agent env, num agents: 8 -[2023-09-12 21:00:52,448][28625] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 21:00:52,453][28625] RunningMeanStd input shape: (23,) -[2023-09-12 21:00:52,454][28625] RunningMeanStd input shape: (3, 72, 128) -[2023-09-12 21:00:52,456][28625] RunningMeanStd input shape: (1,) -[2023-09-12 21:00:52,471][28625] ConvEncoder: input_channels=3 -[2023-09-12 21:00:52,666][28625] Conv encoder output size: 512 -[2023-09-12 21:00:52,669][28625] Policy head output size: 640 -[2023-09-12 21:00:53,778][28625] No checkpoints found -[2023-09-12 21:00:55,451][29521] Stopping RolloutWorker_w5... -[2023-09-12 21:00:55,451][29521] Loop rollout_proc5_evt_loop terminating... -[2023-09-12 21:00:55,451][29519] Stopping RolloutWorker_w3... -[2023-09-12 21:00:55,451][29520] Stopping RolloutWorker_w4... -[2023-09-12 21:00:55,452][29519] Loop rollout_proc3_evt_loop terminating... -[2023-09-12 21:00:55,452][29486] Stopping RolloutWorker_w2... -[2023-09-12 21:00:55,452][29520] Loop rollout_proc4_evt_loop terminating... -[2023-09-12 21:00:55,452][29485] Stopping RolloutWorker_w1... -[2023-09-12 21:00:55,452][29486] Loop rollout_proc2_evt_loop terminating... -[2023-09-12 21:00:55,453][29485] Loop rollout_proc1_evt_loop terminating... -[2023-09-12 21:00:55,453][29523] Stopping RolloutWorker_w7... -[2023-09-12 21:00:55,453][29522] Stopping RolloutWorker_w6... -[2023-09-12 21:00:55,453][29523] Loop rollout_proc7_evt_loop terminating... -[2023-09-12 21:00:55,454][29522] Loop rollout_proc6_evt_loop terminating... -[2023-09-12 21:00:55,457][29453] Stopping RolloutWorker_w0... -[2023-09-12 21:00:55,458][29453] Loop rollout_proc0_evt_loop terminating... -[2023-09-12 21:01:01,865][28625] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json -[2023-09-12 21:01:01,866][28625] Overriding arg 'num_workers' with value 1 passed from command line -[2023-09-12 21:01:01,867][28625] Adding new argument 'no_render'=True that is not in the saved config file! -[2023-09-12 21:01:01,869][28625] Adding new argument 'save_video'=True that is not in the saved config file! -[2023-09-12 21:01:01,870][28625] Adding new argument 'video_frames'=1000000000.0 that is not in the saved config file! -[2023-09-12 21:01:01,872][28625] Adding new argument 'video_name'=None that is not in the saved config file! -[2023-09-12 21:01:01,873][28625] Adding new argument 'max_num_frames'=1000000000.0 that is not in the saved config file! -[2023-09-12 21:01:01,875][28625] Adding new argument 'max_num_episodes'=10 that is not in the saved config file! -[2023-09-12 21:01:01,876][28625] Adding new argument 'push_to_hub'=False that is not in the saved config file! -[2023-09-12 21:01:01,877][28625] Adding new argument 'hf_repository'=None that is not in the saved config file! -[2023-09-12 21:01:01,877][28625] Adding new argument 'policy_index'=0 that is not in the saved config file! -[2023-09-12 21:01:01,878][28625] Adding new argument 'eval_deterministic'=False that is not in the saved config file! -[2023-09-12 21:01:01,879][28625] Adding new argument 'train_script'=None that is not in the saved config file! -[2023-09-12 21:01:01,879][28625] Adding new argument 'enjoy_script'=None that is not in the saved config file! -[2023-09-12 21:01:01,880][28625] Using frameskip 1 and render_action_repeat=4 for evaluation -[2023-09-12 21:01:01,881][28625] Multi agent env, num agents: 8 -[2023-09-12 21:01:01,913][28625] RunningMeanStd input shape: (23,) -[2023-09-12 21:01:01,914][28625] RunningMeanStd input shape: (3, 72, 128) -[2023-09-12 21:01:01,915][28625] RunningMeanStd input shape: (1,) -[2023-09-12 21:01:01,927][28625] ConvEncoder: input_channels=3 -[2023-09-12 21:01:01,971][28625] Conv encoder output size: 512 -[2023-09-12 21:01:01,974][28625] Policy head output size: 640 -[2023-09-12 21:01:02,005][28625] No checkpoints found -[2023-09-12 21:01:43,594][28625] Environment doom_basic already registered, overwriting... -[2023-09-12 21:01:43,596][28625] Environment doom_two_colors_easy already registered, overwriting... -[2023-09-12 21:01:43,599][28625] Environment doom_two_colors_hard already registered, overwriting... -[2023-09-12 21:01:43,601][28625] Environment doom_dm already registered, overwriting... -[2023-09-12 21:01:43,603][28625] Environment doom_dwango5 already registered, overwriting... -[2023-09-12 21:01:43,604][28625] Environment doom_my_way_home_flat_actions already registered, overwriting... -[2023-09-12 21:01:43,605][28625] Environment doom_defend_the_center_flat_actions already registered, overwriting... -[2023-09-12 21:01:43,606][28625] Environment doom_my_way_home already registered, overwriting... -[2023-09-12 21:01:43,607][28625] Environment doom_deadly_corridor already registered, overwriting... -[2023-09-12 21:01:43,608][28625] Environment doom_defend_the_center already registered, overwriting... -[2023-09-12 21:01:43,610][28625] Environment doom_defend_the_line already registered, overwriting... -[2023-09-12 21:01:43,611][28625] Environment doom_health_gathering already registered, overwriting... -[2023-09-12 21:01:43,613][28625] Environment doom_health_gathering_supreme already registered, overwriting... -[2023-09-12 21:01:43,613][28625] Environment doom_battle already registered, overwriting... -[2023-09-12 21:01:43,614][28625] Environment doom_battle2 already registered, overwriting... -[2023-09-12 21:01:43,614][28625] Environment doom_duel_bots already registered, overwriting... -[2023-09-12 21:01:43,615][28625] Environment doom_deathmatch_bots already registered, overwriting... -[2023-09-12 21:01:43,616][28625] Environment doom_duel already registered, overwriting... -[2023-09-12 21:01:43,616][28625] Environment doom_deathmatch_full already registered, overwriting... -[2023-09-12 21:01:43,617][28625] Environment doom_benchmark already registered, overwriting... -[2023-09-12 21:01:43,617][28625] register_encoder_factory: -[2023-09-12 21:01:43,646][28625] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json -[2023-09-12 21:01:43,650][28625] Overriding arg 'train_for_env_steps' with value 1000000 passed from command line -[2023-09-12 21:01:43,659][28625] Experiment dir /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment already exists! -[2023-09-12 21:01:43,661][28625] Resuming existing experiment from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment... -[2023-09-12 21:01:43,661][28625] Weights and Biases integration disabled -[2023-09-12 21:01:43,664][28625] Environment var CUDA_VISIBLE_DEVICES is 0,1 - -[2023-09-12 21:01:45,745][28625] Starting experiment with the following configuration: -help=False -algo=APPO -env=doom_dwango5 -experiment=default_experiment -train_dir=/home/cogstack/Documents/optuna/environments/sample_factory/train_dir -restart_behavior=resume -device=gpu -seed=None -num_policies=1 -async_rl=True -serial_mode=False -batched_sampling=False -num_batches_to_accumulate=2 -worker_num_splits=2 -policy_workers_per_policy=1 -max_policy_lag=1000 -num_workers=8 -num_envs_per_worker=4 -batch_size=1024 -num_batches_per_epoch=1 -num_epochs=1 -rollout=32 -recurrence=32 -shuffle_minibatches=False -gamma=0.99 -reward_scale=1.0 -reward_clip=1000.0 -value_bootstrap=False -normalize_returns=True -exploration_loss_coeff=0.001 -value_loss_coeff=0.5 -kl_loss_coeff=0.0 -exploration_loss=symmetric_kl -gae_lambda=0.95 -ppo_clip_ratio=0.1 -ppo_clip_value=0.2 -with_vtrace=False -vtrace_rho=1.0 -vtrace_c=1.0 -optimizer=adam -adam_eps=1e-06 -adam_beta1=0.9 -adam_beta2=0.999 -max_grad_norm=4.0 -learning_rate=0.0001 -lr_schedule=constant -lr_schedule_kl_threshold=0.008 -lr_adaptive_min=1e-06 -lr_adaptive_max=0.01 -obs_subtract_mean=0.0 -obs_scale=255.0 -normalize_input=True -normalize_input_keys=None -decorrelate_experience_max_seconds=0 -decorrelate_envs_on_one_worker=True -actor_worker_gpus=[] -set_workers_cpu_affinity=True -force_envs_single_thread=False -default_niceness=0 -log_to_file=True -experiment_summaries_interval=10 -flush_summaries_interval=30 -stats_avg=100 -summaries_use_frameskip=True -heartbeat_interval=20 -heartbeat_reporting_interval=600 -train_for_env_steps=1000000 -train_for_seconds=10000000000 -save_every_sec=120 -keep_checkpoints=2 -load_checkpoint_kind=latest -save_milestones_sec=-1 -save_best_every_sec=5 -save_best_metric=reward -save_best_after=100000 -benchmark=False -encoder_mlp_layers=[512, 512] -encoder_conv_architecture=convnet_simple -encoder_conv_mlp_layers=[512] -use_rnn=True -rnn_size=512 -rnn_type=gru -rnn_num_layers=1 -decoder_mlp_layers=[] -nonlinearity=elu -policy_initialization=orthogonal -policy_init_gain=1.0 -actor_critic_share_weights=True -adaptive_stddev=True -continuous_tanh_scale=0.0 -initial_stddev=1.0 -use_env_info_cache=False -env_gpu_actions=False -env_gpu_observations=True -env_frameskip=4 -env_framestack=1 -pixel_format=CHW -use_record_episode_statistics=False -with_wandb=False -wandb_user=None -wandb_project=sample_factory -wandb_group=None -wandb_job_type=SF -wandb_tags=[] -with_pbt=False -pbt_mix_policies_in_one_env=True -pbt_period_env_steps=5000000 -pbt_start_mutation=20000000 -pbt_replace_fraction=0.3 -pbt_mutation_rate=0.15 -pbt_replace_reward_gap=0.1 -pbt_replace_reward_gap_absolute=1e-06 -pbt_optimize_gamma=False -pbt_target_objective=true_objective -pbt_perturb_min=1.1 -pbt_perturb_max=1.5 -num_agents=-1 -num_humans=0 -num_bots=-1 -start_bot_difficulty=None -timelimit=None -res_w=128 -res_h=72 -wide_aspect_ratio=False -eval_env_frameskip=1 -fps=35 -command_line=--env=doom_dm --num_workers=8 --num_envs_per_worker=4 --train_for_env_steps=20000000 -cli_args={'env': 'doom_dm', 'num_workers': 8, 'num_envs_per_worker': 4, 'train_for_env_steps': 20000000} -git_hash=20b6d44612dad7d171f23e13b1f3b4c5e5631cf9 -git_repo_name=https://github.com/MattStammers/optuna.git -[2023-09-12 21:01:45,747][28625] Saving configuration to /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json... -[2023-09-12 21:01:46,757][28625] Rollout worker 0 uses device cpu -[2023-09-12 21:01:46,758][28625] Rollout worker 1 uses device cpu -[2023-09-12 21:01:46,760][28625] Rollout worker 2 uses device cpu -[2023-09-12 21:01:46,761][28625] Rollout worker 3 uses device cpu -[2023-09-12 21:01:46,763][28625] Rollout worker 4 uses device cpu -[2023-09-12 21:01:46,765][28625] Rollout worker 5 uses device cpu -[2023-09-12 21:01:46,767][28625] Rollout worker 6 uses device cpu -[2023-09-12 21:01:46,768][28625] Rollout worker 7 uses device cpu -[2023-09-12 21:01:46,937][28625] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 21:01:46,939][28625] InferenceWorker_p0-w0: min num requests: 2 -[2023-09-12 21:01:46,973][28625] Starting all processes... -[2023-09-12 21:01:46,974][28625] Starting process learner_proc0 -[2023-09-12 21:01:48,714][39537] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 21:01:48,713][28625] Starting all processes... -[2023-09-12 21:01:48,714][39537] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for learning process 0 -[2023-09-12 21:01:48,719][28625] Starting process inference_proc0-0 -[2023-09-12 21:01:48,719][28625] Starting process rollout_proc0 -[2023-09-12 21:01:48,720][28625] Starting process rollout_proc1 -[2023-09-12 21:01:48,720][28625] Starting process rollout_proc2 -[2023-09-12 21:01:48,725][28625] Starting process rollout_proc3 -[2023-09-12 21:01:48,725][28625] Starting process rollout_proc4 -[2023-09-12 21:01:48,759][39537] Num visible devices: 1 -[2023-09-12 21:01:48,725][28625] Starting process rollout_proc5 -[2023-09-12 21:01:48,726][28625] Starting process rollout_proc6 -[2023-09-12 21:01:48,726][28625] Starting process rollout_proc7 -[2023-09-12 21:01:48,796][39537] Starting seed is not provided -[2023-09-12 21:01:48,797][39537] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 21:01:48,797][39537] Initializing actor-critic model on device cuda:0 -[2023-09-12 21:01:48,797][39537] RunningMeanStd input shape: (23,) -[2023-09-12 21:01:48,798][39537] RunningMeanStd input shape: (3, 72, 128) -[2023-09-12 21:01:48,798][39537] RunningMeanStd input shape: (1,) -[2023-09-12 21:01:48,810][39537] ConvEncoder: input_channels=3 -[2023-09-12 21:01:48,954][39537] Conv encoder output size: 512 -[2023-09-12 21:01:48,956][39537] Policy head output size: 640 -[2023-09-12 21:01:48,984][39537] Created Actor Critic model with architecture: -[2023-09-12 21:01:48,986][39537] ActorCriticSharedWeights( - (obs_normalizer): ObservationNormalizer( - (running_mean_std): RunningMeanStdDictInPlace( - (running_mean_std): ModuleDict( - (measurements): RunningMeanStdInPlace() - (obs): RunningMeanStdInPlace() - ) - ) - ) - (returns_normalizer): RecursiveScriptModule(original_name=RunningMeanStdInPlace) - (encoder): VizdoomEncoder( - (basic_encoder): ConvEncoder( - (enc): RecursiveScriptModule( - original_name=ConvEncoderImpl - (conv_head): RecursiveScriptModule( - original_name=Sequential - (0): RecursiveScriptModule(original_name=Conv2d) - (1): RecursiveScriptModule(original_name=ELU) - (2): RecursiveScriptModule(original_name=Conv2d) - (3): RecursiveScriptModule(original_name=ELU) - (4): RecursiveScriptModule(original_name=Conv2d) - (5): RecursiveScriptModule(original_name=ELU) - ) - (mlp_layers): RecursiveScriptModule( - original_name=Sequential - (0): RecursiveScriptModule(original_name=Linear) - (1): RecursiveScriptModule(original_name=ELU) - ) - ) - ) - (measurements_head): Sequential( - (0): Linear(in_features=23, out_features=128, bias=True) - (1): ELU(alpha=1.0) - (2): Linear(in_features=128, out_features=128, bias=True) - (3): ELU(alpha=1.0) - ) - ) - (core): ModelCoreRNN( - (core): GRU(640, 512) - ) - (decoder): MlpDecoder( - (mlp): Identity() - ) - (critic_linear): Linear(in_features=512, out_features=1, bias=True) - (action_parameterization): ActionParameterizationDefault( - (distribution_linear): Linear(in_features=512, out_features=15, bias=True) - ) -) -[2023-09-12 21:01:50,408][39537] Using optimizer -[2023-09-12 21:01:50,409][39537] No checkpoints found -[2023-09-12 21:01:50,409][39537] Did not load from checkpoint, starting from scratch! -[2023-09-12 21:01:50,409][39537] Initialized policy 0 weights for model version 0 -[2023-09-12 21:01:50,412][39537] LearnerWorker_p0 finished initialization! -[2023-09-12 21:01:50,412][39537] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 21:01:50,710][39685] Worker 0 uses CPU cores [0, 1, 2, 3] -[2023-09-12 21:01:50,780][39698] Worker 3 uses CPU cores [12, 13, 14, 15] -[2023-09-12 21:01:50,819][39731] Worker 4 uses CPU cores [16, 17, 18, 19] -[2023-09-12 21:01:50,857][39734] Worker 7 uses CPU cores [28, 29, 30, 31] -[2023-09-12 21:01:50,881][39699] Worker 5 uses CPU cores [20, 21, 22, 23] -[2023-09-12 21:01:50,915][39686] Using GPUs [0] for process 0 (actually maps to GPUs [0]) -[2023-09-12 21:01:50,915][39686] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 -[2023-09-12 21:01:50,931][39696] Worker 2 uses CPU cores [8, 9, 10, 11] -[2023-09-12 21:01:50,954][39686] Num visible devices: 1 -[2023-09-12 21:01:50,992][39733] Worker 6 uses CPU cores [24, 25, 26, 27] -[2023-09-12 21:01:51,090][39697] Worker 1 uses CPU cores [4, 5, 6, 7] -[2023-09-12 21:01:51,618][39686] RunningMeanStd input shape: (23,) -[2023-09-12 21:01:51,618][39686] RunningMeanStd input shape: (3, 72, 128) -[2023-09-12 21:01:51,618][39686] RunningMeanStd input shape: (1,) -[2023-09-12 21:01:51,630][39686] ConvEncoder: input_channels=3 -[2023-09-12 21:01:51,739][39686] Conv encoder output size: 512 -[2023-09-12 21:01:51,740][39686] Policy head output size: 640 -[2023-09-12 21:01:52,083][28625] Inference worker 0-0 is ready! -[2023-09-12 21:01:52,085][28625] All inference workers are ready! Signal rollout workers to start! -[2023-09-12 21:01:52,088][39685] Multi agent env, num agents: 8 -[2023-09-12 21:01:52,090][39698] Multi agent env, num agents: 8 -[2023-09-12 21:01:52,091][39734] Multi agent env, num agents: 8 -[2023-09-12 21:01:52,092][39696] Multi agent env, num agents: 8 -[2023-09-12 21:01:52,092][39699] Multi agent env, num agents: 8 -[2023-09-12 21:01:52,092][39697] Multi agent env, num agents: 8 -[2023-09-12 21:01:52,093][39731] Multi agent env, num agents: 8 -[2023-09-12 21:01:52,094][39733] Multi agent env, num agents: 8 -[2023-09-12 21:01:52,118][39685] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 21:01:52,121][39685] Multi agent env, num agents: 8 -[2023-09-12 21:01:52,124][39734] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 21:01:52,125][39697] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 21:01:52,125][39699] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 21:01:52,126][39696] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 21:01:52,127][39731] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 21:01:52,128][39734] Multi agent env, num agents: 8 -[2023-09-12 21:01:52,129][39697] Multi agent env, num agents: 8 -[2023-09-12 21:01:52,129][39699] Multi agent env, num agents: 8 -[2023-09-12 21:01:52,129][39696] Multi agent env, num agents: 8 -[2023-09-12 21:01:52,130][39731] Multi agent env, num agents: 8 -[2023-09-12 21:01:52,134][39698] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 21:01:52,139][39733] Doom resolution: 160x120, resize resolution: (128, 72) -[2023-09-12 21:01:52,139][39698] Multi agent env, num agents: 8 -[2023-09-12 21:01:52,143][39733] Multi agent env, num agents: 8 -[2023-09-12 21:01:52,151][39685] Port 40300 is available -[2023-09-12 21:01:52,151][39685] Using port 40300 -[2023-09-12 21:01:52,152][39685] Initializing env for player 0, init_info: {'port': 40300}... -[2023-09-12 21:01:52,160][39697] Port 40400 is available -[2023-09-12 21:01:52,160][39697] Using port 40400 -[2023-09-12 21:01:52,161][39696] Port 40500 is available -[2023-09-12 21:01:52,161][39699] Port 40800 is available -[2023-09-12 21:01:52,161][39696] Using port 40500 -[2023-09-12 21:01:52,161][39697] Initializing env for player 0, init_info: {'port': 40400}... -[2023-09-12 21:01:52,161][39699] Using port 40800 -[2023-09-12 21:01:52,161][39734] Port 41000 is available -[2023-09-12 21:01:52,161][39734] Using port 41000 -[2023-09-12 21:01:52,162][39696] Initializing env for player 0, init_info: {'port': 40500}... -[2023-09-12 21:01:52,162][39699] Initializing env for player 0, init_info: {'port': 40800}... -[2023-09-12 21:01:52,163][39734] Initializing env for player 0, init_info: {'port': 41000}... -[2023-09-12 21:01:52,176][39733] Port 40900 is available -[2023-09-12 21:01:52,176][39733] Using port 40900 -[2023-09-12 21:01:52,177][39733] Initializing env for player 0, init_info: {'port': 40900}... -[2023-09-12 21:01:52,185][39685] Using port 40300 on host... -[2023-09-12 21:01:52,186][39698] Port 40600 is available -[2023-09-12 21:01:52,186][39698] Using port 40600 -[2023-09-12 21:01:52,187][39698] Initializing env for player 0, init_info: {'port': 40600}... -[2023-09-12 21:01:52,193][39734] Using port 41000 on host... -[2023-09-12 21:01:52,195][39696] Using port 40500 on host... -[2023-09-12 21:01:52,197][39731] Port 40700 is available -[2023-09-12 21:01:52,197][39731] Using port 40700 -[2023-09-12 21:01:52,202][39685] Initializing env for player 1, init_info: {'port': 40300}... -[2023-09-12 21:01:52,207][39733] Using port 40900 on host... -[2023-09-12 21:01:52,209][39697] Using port 40400 on host... -[2023-09-12 21:01:52,210][39699] Using port 40800 on host... -[2023-09-12 21:01:52,212][39696] Initializing env for player 1, init_info: {'port': 40500}... -[2023-09-12 21:01:52,214][39734] Initializing env for player 1, init_info: {'port': 41000}... -[2023-09-12 21:01:52,217][39699] Initializing env for player 1, init_info: {'port': 40800}... -[2023-09-12 21:01:52,219][39697] Initializing env for player 1, init_info: {'port': 40400}... -[2023-09-12 21:01:52,229][39733] Initializing env for player 1, init_info: {'port': 40900}... -[2023-09-12 21:01:52,229][39698] Using port 40600 on host... -[2023-09-12 21:01:52,238][39698] Initializing env for player 1, init_info: {'port': 40600}... -[2023-09-12 21:01:52,253][39685] Initializing env for player 2, init_info: {'port': 40300}... -[2023-09-12 21:01:52,263][39696] Initializing env for player 2, init_info: {'port': 40500}... -[2023-09-12 21:01:52,264][39734] Initializing env for player 2, init_info: {'port': 41000}... -[2023-09-12 21:01:52,267][39699] Initializing env for player 2, init_info: {'port': 40800}... -[2023-09-12 21:01:52,274][39697] Initializing env for player 2, init_info: {'port': 40400}... -[2023-09-12 21:01:52,279][39733] Initializing env for player 2, init_info: {'port': 40900}... -[2023-09-12 21:01:52,291][39698] Initializing env for player 2, init_info: {'port': 40600}... -[2023-09-12 21:01:52,303][39685] Initializing env for player 3, init_info: {'port': 40300}... -[2023-09-12 21:01:52,315][39734] Initializing env for player 3, init_info: {'port': 41000}... -[2023-09-12 21:01:52,321][39697] Initializing env for player 3, init_info: {'port': 40400}... -[2023-09-12 21:01:52,322][39696] Initializing env for player 3, init_info: {'port': 40500}... -[2023-09-12 21:01:52,324][39699] Initializing env for player 3, init_info: {'port': 40800}... -[2023-09-12 21:01:52,335][39733] Initializing env for player 3, init_info: {'port': 40900}... -[2023-09-12 21:01:52,341][39698] Initializing env for player 3, init_info: {'port': 40600}... -[2023-09-12 21:01:52,353][39685] Initializing env for player 4, init_info: {'port': 40300}... -[2023-09-12 21:01:52,371][39696] Initializing env for player 4, init_info: {'port': 40500}... -[2023-09-12 21:01:52,370][39734] Initializing env for player 4, init_info: {'port': 41000}... -[2023-09-12 21:01:52,371][39697] Initializing env for player 4, init_info: {'port': 40400}... -[2023-09-12 21:01:52,383][39733] Initializing env for player 4, init_info: {'port': 40900}... -[2023-09-12 21:01:52,385][39699] Initializing env for player 4, init_info: {'port': 40800}... -[2023-09-12 21:01:52,392][39698] Initializing env for player 4, init_info: {'port': 40600}... -[2023-09-12 21:01:52,404][39685] Initializing env for player 5, init_info: {'port': 40300}... -[2023-09-12 21:01:52,418][39696] Initializing env for player 5, init_info: {'port': 40500}... -[2023-09-12 21:01:52,426][39734] Initializing env for player 5, init_info: {'port': 41000}... -[2023-09-12 21:01:52,427][39697] Initializing env for player 5, init_info: {'port': 40400}... -[2023-09-12 21:01:52,431][39699] Initializing env for player 5, init_info: {'port': 40800}... -[2023-09-12 21:01:52,435][39733] Initializing env for player 5, init_info: {'port': 40900}... -[2023-09-12 21:01:52,443][39698] Initializing env for player 5, init_info: {'port': 40600}... -[2023-09-12 21:01:52,455][39685] Initializing env for player 6, init_info: {'port': 40300}... -[2023-09-12 21:01:52,475][39696] Initializing env for player 6, init_info: {'port': 40500}... -[2023-09-12 21:01:52,477][39699] Initializing env for player 6, init_info: {'port': 40800}... -[2023-09-12 21:01:52,479][39697] Initializing env for player 6, init_info: {'port': 40400}... -[2023-09-12 21:01:52,483][39734] Initializing env for player 6, init_info: {'port': 41000}... -[2023-09-12 21:01:52,485][39733] Initializing env for player 6, init_info: {'port': 40900}... -[2023-09-12 21:01:52,499][39698] Initializing env for player 6, init_info: {'port': 40600}... -[2023-09-12 21:01:52,515][39685] Initializing env for player 7, init_info: {'port': 40300}... -[2023-09-12 21:01:52,527][39696] Initializing env for player 7, init_info: {'port': 40500}... -[2023-09-12 21:01:52,535][39734] Initializing env for player 7, init_info: {'port': 41000}... -[2023-09-12 21:01:52,535][39697] Initializing env for player 7, init_info: {'port': 40400}... -[2023-09-12 21:01:52,539][39733] Initializing env for player 7, init_info: {'port': 40900}... -[2023-09-12 21:01:52,539][39699] Initializing env for player 7, init_info: {'port': 40800}... -[2023-09-12 21:01:52,551][39698] Initializing env for player 7, init_info: {'port': 40600}... -[2023-09-12 21:01:53,664][28625] Fps is (10 sec: nan, 60 sec: nan, 300 sec: nan). Total num frames: 0. Throughput: 0: nan. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:01:53,759][39685] Initialized w:0 v:0 player:5 -[2023-09-12 21:01:53,761][39685] Initialized w:0 v:0 player:1 -[2023-09-12 21:01:53,762][39685] Initialized w:0 v:0 player:7 -[2023-09-12 21:01:53,762][39685] Initialized w:0 v:0 player:6 -[2023-09-12 21:01:53,762][39685] Initialized w:0 v:0 player:3 -[2023-09-12 21:01:53,762][39685] Initialized w:0 v:0 player:2 -[2023-09-12 21:01:53,763][39685] Initialized w:0 v:0 player:4 -[2023-09-12 21:01:53,763][39685] Initialized w:0 v:0 player:0 -[2023-09-12 21:01:53,765][39685] 8 agent workers initialized for env 0! -[2023-09-12 21:01:53,832][39685] Decorrelating experience for 0 frames... -[2023-09-12 21:01:53,833][39685] Port 40301 is available -[2023-09-12 21:01:53,833][39685] Using port 40301 -[2023-09-12 21:01:53,834][39685] Initializing env for player 0, init_info: {'port': 40301}... -[2023-09-12 21:01:53,863][39685] Using port 40301 on host... -[2023-09-12 21:01:53,884][39685] Initializing env for player 1, init_info: {'port': 40301}... -[2023-09-12 21:01:53,935][39685] Initializing env for player 2, init_info: {'port': 40301}... -[2023-09-12 21:01:53,991][39697] Initialized w:1 v:0 player:3 -[2023-09-12 21:01:53,992][39685] Initializing env for player 3, init_info: {'port': 40301}... -[2023-09-12 21:01:53,993][39697] Initialized w:1 v:0 player:2 -[2023-09-12 21:01:53,994][39697] Initialized w:1 v:0 player:6 -[2023-09-12 21:01:53,994][39697] Initialized w:1 v:0 player:1 -[2023-09-12 21:01:53,995][39697] Initialized w:1 v:0 player:5 -[2023-09-12 21:01:53,995][39697] Initialized w:1 v:0 player:0 -[2023-09-12 21:01:53,995][39697] Initialized w:1 v:0 player:7 -[2023-09-12 21:01:53,995][39697] Initialized w:1 v:0 player:4 -[2023-09-12 21:01:53,997][39697] 8 agent workers initialized for env 1! -[2023-09-12 21:01:54,031][39699] Initialized w:5 v:0 player:2 -[2023-09-12 21:01:54,034][39699] Initialized w:5 v:0 player:7 -[2023-09-12 21:01:54,034][39699] Initialized w:5 v:0 player:0 -[2023-09-12 21:01:54,035][39734] Initialized w:7 v:0 player:7 -[2023-09-12 21:01:54,034][39699] Initialized w:5 v:0 player:4 -[2023-09-12 21:01:54,035][39699] Initialized w:5 v:0 player:5 -[2023-09-12 21:01:54,035][39699] Initialized w:5 v:0 player:1 -[2023-09-12 21:01:54,036][39699] Initialized w:5 v:0 player:3 -[2023-09-12 21:01:54,036][39699] Initialized w:5 v:0 player:6 -[2023-09-12 21:01:54,038][39734] Initialized w:7 v:0 player:2 -[2023-09-12 21:01:54,038][39699] 8 agent workers initialized for env 5! -[2023-09-12 21:01:54,038][39734] Initialized w:7 v:0 player:3 -[2023-09-12 21:01:54,038][39734] Initialized w:7 v:0 player:4 -[2023-09-12 21:01:54,038][39734] Initialized w:7 v:0 player:6 -[2023-09-12 21:01:54,039][39734] Initialized w:7 v:0 player:0 -[2023-09-12 21:01:54,039][39734] Initialized w:7 v:0 player:5 -[2023-09-12 21:01:54,039][39734] Initialized w:7 v:0 player:1 -[2023-09-12 21:01:54,042][39734] 8 agent workers initialized for env 7! -[2023-09-12 21:01:54,055][39733] Initialized w:6 v:0 player:7 -[2023-09-12 21:01:54,055][39685] Initializing env for player 4, init_info: {'port': 40301}... -[2023-09-12 21:01:54,056][39697] Decorrelating experience for 0 frames... -[2023-09-12 21:01:54,057][39733] Initialized w:6 v:0 player:1 -[2023-09-12 21:01:54,058][39697] Port 40401 is available -[2023-09-12 21:01:54,058][39697] Using port 40401 -[2023-09-12 21:01:54,058][39733] Initialized w:6 v:0 player:3 -[2023-09-12 21:01:54,058][39697] Initializing env for player 0, init_info: {'port': 40401}... -[2023-09-12 21:01:54,058][39733] Initialized w:6 v:0 player:2 -[2023-09-12 21:01:54,058][39733] Initialized w:6 v:0 player:6 -[2023-09-12 21:01:54,059][39733] Initialized w:6 v:0 player:4 -[2023-09-12 21:01:54,059][39733] Initialized w:6 v:0 player:5 -[2023-09-12 21:01:54,059][39733] Initialized w:6 v:0 player:0 -[2023-09-12 21:01:54,061][39733] 8 agent workers initialized for env 6! -[2023-09-12 21:01:54,064][39731] Initializing env for player 0, init_info: {'port': 40700}... -[2023-09-12 21:01:54,086][39699] Decorrelating experience for 0 frames... -[2023-09-12 21:01:54,088][39699] Port 40801 is available -[2023-09-12 21:01:54,089][39699] Using port 40801 -[2023-09-12 21:01:54,089][39699] Initializing env for player 0, init_info: {'port': 40801}... -[2023-09-12 21:01:54,091][39734] Decorrelating experience for 0 frames... -[2023-09-12 21:01:54,093][39734] Port 41001 is available -[2023-09-12 21:01:54,094][39734] Using port 41001 -[2023-09-12 21:01:54,094][39697] Using port 40401 on host... -[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:0 -[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:7 -[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:3 -[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:5 -[2023-09-12 21:01:54,098][39731] Using port 40700 on host... -[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:1 -[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:6 -[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:4 -[2023-09-12 21:01:54,096][39698] Initialized w:3 v:0 player:2 -[2023-09-12 21:01:54,100][39698] 8 agent workers initialized for env 3! -[2023-09-12 21:01:54,103][39685] Initializing env for player 5, init_info: {'port': 40301}... -[2023-09-12 21:01:54,112][39733] Decorrelating experience for 0 frames... -[2023-09-12 21:01:54,114][39733] Port 40901 is available -[2023-09-12 21:01:54,115][39733] Using port 40901 -[2023-09-12 21:01:54,115][39731] Initializing env for player 1, init_info: {'port': 40700}... -[2023-09-12 21:01:54,115][39733] Initializing env for player 0, init_info: {'port': 40901}... -[2023-09-12 21:01:54,119][39696] Initialized w:2 v:0 player:3 -[2023-09-12 21:01:54,120][39696] Initialized w:2 v:0 player:6 -[2023-09-12 21:01:54,120][39696] Initialized w:2 v:0 player:5 -[2023-09-12 21:01:54,120][39696] Initialized w:2 v:0 player:2 -[2023-09-12 21:01:54,120][39696] Initialized w:2 v:0 player:0 -[2023-09-12 21:01:54,120][39696] Initialized w:2 v:0 player:1 -[2023-09-12 21:01:54,121][39696] Initialized w:2 v:0 player:4 -[2023-09-12 21:01:54,121][39696] Initialized w:2 v:0 player:7 -[2023-09-12 21:01:54,123][39697] Initializing env for player 1, init_info: {'port': 40401}... -[2023-09-12 21:01:54,124][39696] 8 agent workers initialized for env 2! -[2023-09-12 21:01:54,132][39699] Using port 40801 on host... -[2023-09-12 21:01:54,141][39699] Initializing env for player 1, init_info: {'port': 40801}... -[2023-09-12 21:01:54,148][39698] Decorrelating experience for 0 frames... -[2023-09-12 21:01:54,149][39698] Port 40601 is available -[2023-09-12 21:01:54,150][39698] Using port 40601 -[2023-09-12 21:01:54,150][39698] Initializing env for player 0, init_info: {'port': 40601}... -[2023-09-12 21:01:54,157][39733] Using port 40901 on host... -[2023-09-12 21:01:54,157][39696] Decorrelating experience for 0 frames... -[2023-09-12 21:01:54,159][39696] Port 40501 is available -[2023-09-12 21:01:54,159][39696] Using port 40501 -[2023-09-12 21:01:54,166][39733] Initializing env for player 1, init_info: {'port': 40901}... -[2023-09-12 21:01:54,167][39685] Initializing env for player 6, init_info: {'port': 40301}... -[2023-09-12 21:01:54,165][39731] Initializing env for player 2, init_info: {'port': 40700}... -[2023-09-12 21:01:54,173][39697] Initializing env for player 2, init_info: {'port': 40401}... -[2023-09-12 21:01:54,179][39698] Using port 40601 on host... -[2023-09-12 21:01:54,192][39699] Initializing env for player 2, init_info: {'port': 40801}... -[2023-09-12 21:01:54,201][39698] Initializing env for player 1, init_info: {'port': 40601}... -[2023-09-12 21:01:54,213][39685] Initializing env for player 7, init_info: {'port': 40301}... -[2023-09-12 21:01:54,217][39731] Initializing env for player 3, init_info: {'port': 40700}... -[2023-09-12 21:01:54,219][39733] Initializing env for player 2, init_info: {'port': 40901}... -[2023-09-12 21:01:54,230][39697] Initializing env for player 3, init_info: {'port': 40401}... -[2023-09-12 21:01:54,242][39699] Initializing env for player 3, init_info: {'port': 40801}... -[2023-09-12 21:01:54,251][39698] Initializing env for player 2, init_info: {'port': 40601}... -[2023-09-12 21:01:54,269][39733] Initializing env for player 3, init_info: {'port': 40901}... -[2023-09-12 21:01:54,273][39731] Initializing env for player 4, init_info: {'port': 40700}... -[2023-09-12 21:01:54,283][39697] Initializing env for player 4, init_info: {'port': 40401}... -[2023-09-12 21:01:54,303][39698] Initializing env for player 3, init_info: {'port': 40601}... -[2023-09-12 21:01:54,318][39699] Initializing env for player 4, init_info: {'port': 40801}... -[2023-09-12 21:01:54,327][39731] Initializing env for player 5, init_info: {'port': 40700}... -[2023-09-12 21:01:54,339][39697] Initializing env for player 5, init_info: {'port': 40401}... -[2023-09-12 21:01:54,339][39733] Initializing env for player 4, init_info: {'port': 40901}... -[2023-09-12 21:01:54,355][39698] Initializing env for player 4, init_info: {'port': 40601}... -[2023-09-12 21:01:54,372][39699] Initializing env for player 5, init_info: {'port': 40801}... -[2023-09-12 21:01:54,387][39731] Initializing env for player 6, init_info: {'port': 40700}... -[2023-09-12 21:01:54,388][39733] Initializing env for player 5, init_info: {'port': 40901}... -[2023-09-12 21:01:54,395][39697] Initializing env for player 6, init_info: {'port': 40401}... -[2023-09-12 21:01:54,410][39698] Initializing env for player 5, init_info: {'port': 40601}... -[2023-09-12 21:01:54,427][39699] Initializing env for player 6, init_info: {'port': 40801}... -[2023-09-12 21:01:54,438][39733] Initializing env for player 6, init_info: {'port': 40901}... -[2023-09-12 21:01:54,443][39731] Initializing env for player 7, init_info: {'port': 40700}... -[2023-09-12 21:01:54,446][39697] Initializing env for player 7, init_info: {'port': 40401}... -[2023-09-12 21:01:54,463][39698] Initializing env for player 6, init_info: {'port': 40601}... -[2023-09-12 21:01:54,479][39699] Initializing env for player 7, init_info: {'port': 40801}... -[2023-09-12 21:01:54,499][39733] Initializing env for player 7, init_info: {'port': 40901}... -[2023-09-12 21:01:54,523][39698] Initializing env for player 7, init_info: {'port': 40601}... -[2023-09-12 21:01:55,800][39685] Initialized w:0 v:1 player:4 -[2023-09-12 21:01:55,802][39685] Initialized w:0 v:1 player:1 -[2023-09-12 21:01:55,802][39685] Initialized w:0 v:1 player:0 -[2023-09-12 21:01:55,802][39685] Initialized w:0 v:1 player:5 -[2023-09-12 21:01:55,802][39685] Initialized w:0 v:1 player:7 -[2023-09-12 21:01:55,803][39685] Initialized w:0 v:1 player:3 -[2023-09-12 21:01:55,803][39685] Initialized w:0 v:1 player:6 -[2023-09-12 21:01:55,803][39685] Initialized w:0 v:1 player:2 -[2023-09-12 21:01:55,805][39685] 8 agent workers initialized for env 0! -[2023-09-12 21:01:55,848][39734] Initializing env for player 0, init_info: {'port': 41001}... -[2023-09-12 21:01:55,857][39685] Decorrelating experience for 32 frames... -[2023-09-12 21:01:55,898][39734] Using port 41001 on host... -[2023-09-12 21:01:55,898][39734] Initializing env for player 1, init_info: {'port': 41001}... -[2023-09-12 21:01:55,931][39698] Initialized w:3 v:1 player:3 -[2023-09-12 21:01:55,933][39698] Initialized w:3 v:1 player:7 -[2023-09-12 21:01:55,933][39698] Initialized w:3 v:1 player:1 -[2023-09-12 21:01:55,934][39698] Initialized w:3 v:1 player:5 -[2023-09-12 21:01:55,934][39698] Initialized w:3 v:1 player:4 -[2023-09-12 21:01:55,934][39698] Initialized w:3 v:1 player:6 -[2023-09-12 21:01:55,934][39698] Initialized w:3 v:1 player:2 -[2023-09-12 21:01:55,934][39698] Initialized w:3 v:1 player:0 -[2023-09-12 21:01:55,937][39698] 8 agent workers initialized for env 3! -[2023-09-12 21:01:55,950][39734] Initializing env for player 2, init_info: {'port': 41001}... -[2023-09-12 21:01:55,969][39733] Initialized w:6 v:1 player:6 -[2023-09-12 21:01:55,971][39733] Initialized w:6 v:1 player:2 -[2023-09-12 21:01:55,971][39733] Initialized w:6 v:1 player:1 -[2023-09-12 21:01:55,972][39733] Initialized w:6 v:1 player:0 -[2023-09-12 21:01:55,972][39733] Initialized w:6 v:1 player:7 -[2023-09-12 21:01:55,972][39733] Initialized w:6 v:1 player:5 -[2023-09-12 21:01:55,973][39733] Initialized w:6 v:1 player:3 -[2023-09-12 21:01:55,973][39733] Initialized w:6 v:1 player:4 -[2023-09-12 21:01:55,974][39733] 8 agent workers initialized for env 6! -[2023-09-12 21:01:55,974][39698] Decorrelating experience for 32 frames... -[2023-09-12 21:01:55,977][39731] Initialized w:4 v:0 player:3 -[2023-09-12 21:01:55,978][39696] Initializing env for player 0, init_info: {'port': 40501}... -[2023-09-12 21:01:55,977][39731] Initialized w:4 v:0 player:2 -[2023-09-12 21:01:55,978][39731] Initialized w:4 v:0 player:6 -[2023-09-12 21:01:55,978][39731] Initialized w:4 v:0 player:1 -[2023-09-12 21:01:55,978][39731] Initialized w:4 v:0 player:5 -[2023-09-12 21:01:55,978][39731] Initialized w:4 v:0 player:7 -[2023-09-12 21:01:55,979][39731] Initialized w:4 v:0 player:4 -[2023-09-12 21:01:55,979][39731] Initialized w:4 v:0 player:0 -[2023-09-12 21:01:55,982][39731] 8 agent workers initialized for env 4! -[2023-09-12 21:01:56,004][39697] Initialized w:1 v:1 player:4 -[2023-09-12 21:01:56,007][39697] Initialized w:1 v:1 player:1 -[2023-09-12 21:01:56,007][39697] Initialized w:1 v:1 player:3 -[2023-09-12 21:01:56,008][39697] Initialized w:1 v:1 player:2 -[2023-09-12 21:01:56,008][39697] Initialized w:1 v:1 player:6 -[2023-09-12 21:01:56,008][39697] Initialized w:1 v:1 player:0 -[2023-09-12 21:01:56,008][39697] Initialized w:1 v:1 player:5 -[2023-09-12 21:01:56,009][39697] Initialized w:1 v:1 player:7 -[2023-09-12 21:01:56,011][39697] 8 agent workers initialized for env 1! -[2023-09-12 21:01:56,015][39734] Initializing env for player 3, init_info: {'port': 41001}... -[2023-09-12 21:01:56,024][39731] Decorrelating experience for 0 frames... -[2023-09-12 21:01:56,024][39696] Using port 40501 on host... -[2023-09-12 21:01:56,029][39731] Port 40701 is available -[2023-09-12 21:01:56,029][39731] Using port 40701 -[2023-09-12 21:01:56,030][39731] Initializing env for player 0, init_info: {'port': 40701}... -[2023-09-12 21:01:56,030][39733] Decorrelating experience for 32 frames... -[2023-09-12 21:01:56,035][39696] Initializing env for player 1, init_info: {'port': 40501}... -[2023-09-12 21:01:56,042][39697] Decorrelating experience for 32 frames... -[2023-09-12 21:01:56,055][39699] Initialized w:5 v:1 player:7 -[2023-09-12 21:01:56,056][39699] Initialized w:5 v:1 player:6 -[2023-09-12 21:01:56,057][39699] Initialized w:5 v:1 player:3 -[2023-09-12 21:01:56,057][39699] Initialized w:5 v:1 player:4 -[2023-09-12 21:01:56,057][39699] Initialized w:5 v:1 player:2 -[2023-09-12 21:01:56,058][39699] Initialized w:5 v:1 player:1 -[2023-09-12 21:01:56,058][39699] Initialized w:5 v:1 player:0 -[2023-09-12 21:01:56,059][39699] Initialized w:5 v:1 player:5 -[2023-09-12 21:01:56,061][39699] 8 agent workers initialized for env 5! -[2023-09-12 21:01:56,067][39734] Initializing env for player 4, init_info: {'port': 41001}... -[2023-09-12 21:01:56,070][39731] Using port 40701 on host... -[2023-09-12 21:01:56,080][39731] Initializing env for player 1, init_info: {'port': 40701}... -[2023-09-12 21:01:56,088][39696] Initializing env for player 2, init_info: {'port': 40501}... -[2023-09-12 21:01:56,096][39699] Decorrelating experience for 32 frames... -[2023-09-12 21:01:56,131][39731] Initializing env for player 2, init_info: {'port': 40701}... -[2023-09-12 21:01:56,126][39734] Initializing env for player 5, init_info: {'port': 41001}... -[2023-09-12 21:01:56,139][39696] Initializing env for player 3, init_info: {'port': 40501}... -[2023-09-12 21:01:56,179][39734] Initializing env for player 6, init_info: {'port': 41001}... -[2023-09-12 21:01:56,183][39731] Initializing env for player 3, init_info: {'port': 40701}... -[2023-09-12 21:01:56,195][39696] Initializing env for player 4, init_info: {'port': 40501}... -[2023-09-12 21:01:56,235][39731] Initializing env for player 4, init_info: {'port': 40701}... -[2023-09-12 21:01:56,241][39696] Initializing env for player 5, init_info: {'port': 40501}... -[2023-09-12 21:01:56,231][39734] Initializing env for player 7, init_info: {'port': 41001}... -[2023-09-12 21:01:56,259][39685] Multi agent env, num agents: 8 -[2023-09-12 21:01:56,284][39731] Initializing env for player 5, init_info: {'port': 40701}... -[2023-09-12 21:01:56,299][39696] Initializing env for player 6, init_info: {'port': 40501}... -[2023-09-12 21:01:56,306][39685] Multi agent env, num agents: 8 -[2023-09-12 21:01:56,338][39731] Initializing env for player 6, init_info: {'port': 40701}... -[2023-09-12 21:01:56,340][39685] Port 40302 is available -[2023-09-12 21:01:56,340][39685] Using port 40302 -[2023-09-12 21:01:56,341][39685] Initializing env for player 0, init_info: {'port': 40302}... -[2023-09-12 21:01:56,360][39696] Initializing env for player 7, init_info: {'port': 40501}... -[2023-09-12 21:01:56,367][39698] Multi agent env, num agents: 8 -[2023-09-12 21:01:56,387][39685] Using port 40302 on host... -[2023-09-12 21:01:56,391][39731] Initializing env for player 7, init_info: {'port': 40701}... -[2023-09-12 21:01:56,398][39685] Initializing env for player 1, init_info: {'port': 40302}... -[2023-09-12 21:01:56,413][39698] Multi agent env, num agents: 8 -[2023-09-12 21:01:56,437][39733] Multi agent env, num agents: 8 -[2023-09-12 21:01:56,455][39685] Initializing env for player 2, init_info: {'port': 40302}... -[2023-09-12 21:01:56,459][39698] Port 40602 is available -[2023-09-12 21:01:56,459][39698] Using port 40602 -[2023-09-12 21:01:56,460][39698] Initializing env for player 0, init_info: {'port': 40602}... -[2023-09-12 21:01:56,482][39733] Multi agent env, num agents: 8 -[2023-09-12 21:01:56,505][39698] Using port 40602 on host... -[2023-09-12 21:01:56,505][39685] Initializing env for player 3, init_info: {'port': 40302}... -[2023-09-12 21:01:56,509][39697] Multi agent env, num agents: 8 -[2023-09-12 21:01:56,516][39698] Initializing env for player 1, init_info: {'port': 40602}... -[2023-09-12 21:01:56,528][39733] Port 40902 is available -[2023-09-12 21:01:56,528][39733] Using port 40902 -[2023-09-12 21:01:56,529][39733] Initializing env for player 0, init_info: {'port': 40902}... -[2023-09-12 21:01:56,553][39697] Multi agent env, num agents: 8 -[2023-09-12 21:01:56,555][39699] Multi agent env, num agents: 8 -[2023-09-12 21:01:56,557][39685] Initializing env for player 4, init_info: {'port': 40302}... -[2023-09-12 21:01:56,566][39698] Initializing env for player 2, init_info: {'port': 40602}... -[2023-09-12 21:01:56,573][39733] Using port 40902 on host... -[2023-09-12 21:01:56,584][39733] Initializing env for player 1, init_info: {'port': 40902}... -[2023-09-12 21:01:56,605][39699] Multi agent env, num agents: 8 -[2023-09-12 21:01:56,611][39685] Initializing env for player 5, init_info: {'port': 40302}... -[2023-09-12 21:01:56,617][39698] Initializing env for player 3, init_info: {'port': 40602}... -[2023-09-12 21:01:56,621][39697] Port 40402 is available -[2023-09-12 21:01:56,621][39697] Using port 40402 -[2023-09-12 21:01:56,622][39697] Initializing env for player 0, init_info: {'port': 40402}... -[2023-09-12 21:01:56,637][39699] Port 40802 is available -[2023-09-12 21:01:56,637][39699] Using port 40802 -[2023-09-12 21:01:56,637][39699] Initializing env for player 0, init_info: {'port': 40802}... -[2023-09-12 21:01:56,644][39733] Initializing env for player 2, init_info: {'port': 40902}... -[2023-09-12 21:01:56,658][39697] Using port 40402 on host... -[2023-09-12 21:01:56,659][39685] Initializing env for player 6, init_info: {'port': 40302}... -[2023-09-12 21:01:56,673][39697] Initializing env for player 1, init_info: {'port': 40402}... -[2023-09-12 21:01:56,676][39698] Initializing env for player 4, init_info: {'port': 40602}... -[2023-09-12 21:01:56,681][39699] Using port 40802 on host... -[2023-09-12 21:01:56,688][39699] Initializing env for player 1, init_info: {'port': 40802}... -[2023-09-12 21:01:56,707][39733] Initializing env for player 3, init_info: {'port': 40902}... -[2023-09-12 21:01:56,713][39685] Initializing env for player 7, init_info: {'port': 40302}... -[2023-09-12 21:01:56,726][39697] Initializing env for player 2, init_info: {'port': 40402}... -[2023-09-12 21:01:56,739][39699] Initializing env for player 2, init_info: {'port': 40802}... -[2023-09-12 21:01:56,747][39698] Initializing env for player 5, init_info: {'port': 40602}... -[2023-09-12 21:01:56,755][39733] Initializing env for player 4, init_info: {'port': 40902}... -[2023-09-12 21:01:56,787][39697] Initializing env for player 3, init_info: {'port': 40402}... -[2023-09-12 21:01:56,790][39699] Initializing env for player 3, init_info: {'port': 40802}... -[2023-09-12 21:01:56,801][39698] Initializing env for player 6, init_info: {'port': 40602}... -[2023-09-12 21:01:56,821][39733] Initializing env for player 5, init_info: {'port': 40902}... -[2023-09-12 21:01:56,851][39698] Initializing env for player 7, init_info: {'port': 40602}... -[2023-09-12 21:01:56,851][39697] Initializing env for player 4, init_info: {'port': 40402}... -[2023-09-12 21:01:56,856][39699] Initializing env for player 4, init_info: {'port': 40802}... -[2023-09-12 21:01:56,883][39733] Initializing env for player 6, init_info: {'port': 40902}... -[2023-09-12 21:01:56,903][39697] Initializing env for player 5, init_info: {'port': 40402}... -[2023-09-12 21:01:56,927][39699] Initializing env for player 5, init_info: {'port': 40802}... -[2023-09-12 21:01:56,935][39733] Initializing env for player 7, init_info: {'port': 40902}... -[2023-09-12 21:01:56,973][39699] Initializing env for player 6, init_info: {'port': 40802}... -[2023-09-12 21:01:57,024][39699] Initializing env for player 7, init_info: {'port': 40802}... -[2023-09-12 21:01:56,971][39697] Initializing env for player 6, init_info: {'port': 40402}... -[2023-09-12 21:01:57,035][39697] Initializing env for player 7, init_info: {'port': 40402}... -[2023-09-12 21:01:57,632][39734] Initialized w:7 v:1 player:1 -[2023-09-12 21:01:57,633][39734] Initialized w:7 v:1 player:2 -[2023-09-12 21:01:57,633][39734] Initialized w:7 v:1 player:0 -[2023-09-12 21:01:57,634][39734] Initialized w:7 v:1 player:4 -[2023-09-12 21:01:57,634][39734] Initialized w:7 v:1 player:3 -[2023-09-12 21:01:57,634][39734] Initialized w:7 v:1 player:7 -[2023-09-12 21:01:57,634][39734] Initialized w:7 v:1 player:6 -[2023-09-12 21:01:57,635][39734] Initialized w:7 v:1 player:5 -[2023-09-12 21:01:57,636][39734] 8 agent workers initialized for env 7! -[2023-09-12 21:01:57,687][39696] Initialized w:2 v:1 player:5 -[2023-09-12 21:01:57,688][39696] Initialized w:2 v:1 player:0 -[2023-09-12 21:01:57,688][39696] Initialized w:2 v:1 player:1 -[2023-09-12 21:01:57,689][39696] Initialized w:2 v:1 player:6 -[2023-09-12 21:01:57,690][39696] Initialized w:2 v:1 player:4 -[2023-09-12 21:01:57,690][39696] Initialized w:2 v:1 player:2 -[2023-09-12 21:01:57,691][39696] Initialized w:2 v:1 player:3 -[2023-09-12 21:01:57,692][39696] Initialized w:2 v:1 player:7 -[2023-09-12 21:01:57,692][39696] 8 agent workers initialized for env 2! -[2023-09-12 21:01:57,710][39734] Decorrelating experience for 32 frames... -[2023-09-12 21:01:57,747][39696] Decorrelating experience for 32 frames... -[2023-09-12 21:01:57,901][39731] Initialized w:4 v:1 player:4 -[2023-09-12 21:01:57,902][39731] Initialized w:4 v:1 player:3 -[2023-09-12 21:01:57,902][39731] Initialized w:4 v:1 player:6 -[2023-09-12 21:01:57,902][39731] Initialized w:4 v:1 player:1 -[2023-09-12 21:01:57,903][39731] Initialized w:4 v:1 player:5 -[2023-09-12 21:01:57,903][39731] Initialized w:4 v:1 player:0 -[2023-09-12 21:01:57,904][39731] Initialized w:4 v:1 player:7 -[2023-09-12 21:01:57,904][39731] Initialized w:4 v:1 player:2 -[2023-09-12 21:01:57,906][39731] 8 agent workers initialized for env 4! -[2023-09-12 21:01:57,948][39731] Decorrelating experience for 32 frames... -[2023-09-12 21:01:58,004][39734] Multi agent env, num agents: 8 -[2023-09-12 21:01:58,038][39734] Multi agent env, num agents: 8 -[2023-09-12 21:01:58,069][39734] Port 41002 is available -[2023-09-12 21:01:58,069][39734] Using port 41002 -[2023-09-12 21:01:58,069][39734] Initializing env for player 0, init_info: {'port': 41002}... -[2023-09-12 21:01:58,100][39734] Using port 41002 on host... -[2023-09-12 21:01:58,120][39734] Initializing env for player 1, init_info: {'port': 41002}... -[2023-09-12 21:01:58,171][39734] Initializing env for player 2, init_info: {'port': 41002}... -[2023-09-12 21:01:58,185][39696] Multi agent env, num agents: 8 -[2023-09-12 21:01:58,227][39734] Initializing env for player 3, init_info: {'port': 41002}... -[2023-09-12 21:01:58,232][39696] Multi agent env, num agents: 8 -[2023-09-12 21:01:58,239][39685] Initialized w:0 v:2 player:2 -[2023-09-12 21:01:58,241][39685] Initialized w:0 v:2 player:6 -[2023-09-12 21:01:58,242][39685] Initialized w:0 v:2 player:3 -[2023-09-12 21:01:58,243][39685] Initialized w:0 v:2 player:1 -[2023-09-12 21:01:58,244][39685] Initialized w:0 v:2 player:5 -[2023-09-12 21:01:58,245][39685] Initialized w:0 v:2 player:0 -[2023-09-12 21:01:58,246][39685] Initialized w:0 v:2 player:4 -[2023-09-12 21:01:58,249][39685] Initialized w:0 v:2 player:7 -[2023-09-12 21:01:58,250][39685] 8 agent workers initialized for env 0! -[2023-09-12 21:01:58,275][39734] Initializing env for player 4, init_info: {'port': 41002}... -[2023-09-12 21:01:58,279][39733] Initialized w:6 v:2 player:3 -[2023-09-12 21:01:58,281][39733] Initialized w:6 v:2 player:7 -[2023-09-12 21:01:58,281][39733] Initialized w:6 v:2 player:0 -[2023-09-12 21:01:58,284][39733] Initialized w:6 v:2 player:5 -[2023-09-12 21:01:58,284][39733] Initialized w:6 v:2 player:1 -[2023-09-12 21:01:58,287][39733] Initialized w:6 v:2 player:6 -[2023-09-12 21:01:58,287][39733] Initialized w:6 v:2 player:2 -[2023-09-12 21:01:58,288][39733] Initialized w:6 v:2 player:4 -[2023-09-12 21:01:58,289][39733] 8 agent workers initialized for env 6! -[2023-09-12 21:01:58,310][39698] Initialized w:3 v:2 player:6 -[2023-09-12 21:01:58,312][39698] Initialized w:3 v:2 player:7 -[2023-09-12 21:01:58,312][39698] Initialized w:3 v:2 player:3 -[2023-09-12 21:01:58,312][39698] Initialized w:3 v:2 player:5 -[2023-09-12 21:01:58,312][39698] Initialized w:3 v:2 player:0 -[2023-09-12 21:01:58,312][39698] Initialized w:3 v:2 player:4 -[2023-09-12 21:01:58,313][39698] Initialized w:3 v:2 player:1 -[2023-09-12 21:01:58,313][39698] Initialized w:3 v:2 player:2 -[2023-09-12 21:01:58,318][39698] 8 agent workers initialized for env 3! -[2023-09-12 21:01:58,327][39734] Initializing env for player 5, init_info: {'port': 41002}... -[2023-09-12 21:01:58,328][39696] Port 40502 is available -[2023-09-12 21:01:58,328][39696] Using port 40502 -[2023-09-12 21:01:58,329][39696] Initializing env for player 0, init_info: {'port': 40502}... -[2023-09-12 21:01:58,329][39685] Decorrelating experience for 64 frames... -[2023-09-12 21:01:58,343][39733] Decorrelating experience for 64 frames... -[2023-09-12 21:01:58,362][39696] Using port 40502 on host... -[2023-09-12 21:01:58,379][39696] Initializing env for player 1, init_info: {'port': 40502}... -[2023-09-12 21:01:58,379][39734] Initializing env for player 6, init_info: {'port': 41002}... -[2023-09-12 21:01:58,384][39698] Decorrelating experience for 64 frames... -[2023-09-12 21:01:58,395][39731] Multi agent env, num agents: 8 -[2023-09-12 21:01:58,431][39696] Initializing env for player 2, init_info: {'port': 40502}... -[2023-09-12 21:01:58,434][39731] Multi agent env, num agents: 8 -[2023-09-12 21:01:58,442][39734] Initializing env for player 7, init_info: {'port': 41002}... -[2023-09-12 21:01:58,471][39731] Port 40702 is available -[2023-09-12 21:01:58,471][39731] Using port 40702 -[2023-09-12 21:01:58,472][39731] Initializing env for player 0, init_info: {'port': 40702}... -[2023-09-12 21:01:58,487][39696] Initializing env for player 3, init_info: {'port': 40502}... -[2023-09-12 21:01:58,509][39731] Using port 40702 on host... -[2023-09-12 21:01:58,522][39731] Initializing env for player 1, init_info: {'port': 40702}... -[2023-09-12 21:01:58,547][39696] Initializing env for player 4, init_info: {'port': 40502}... -[2023-09-12 21:01:58,571][39697] Initialized w:1 v:2 player:6 -[2023-09-12 21:01:58,575][39731] Initializing env for player 2, init_info: {'port': 40702}... -[2023-09-12 21:01:58,577][39697] Initialized w:1 v:2 player:7 -[2023-09-12 21:01:58,577][39697] Initialized w:1 v:2 player:0 -[2023-09-12 21:01:58,578][39697] Initialized w:1 v:2 player:1 -[2023-09-12 21:01:58,578][39697] Initialized w:1 v:2 player:4 -[2023-09-12 21:01:58,578][39697] Initialized w:1 v:2 player:3 -[2023-09-12 21:01:58,578][39697] Initialized w:1 v:2 player:2 -[2023-09-12 21:01:58,579][39697] Initialized w:1 v:2 player:5 -[2023-09-12 21:01:58,583][39697] 8 agent workers initialized for env 1! -[2023-09-12 21:01:58,594][39696] Initializing env for player 5, init_info: {'port': 40502}... -[2023-09-12 21:01:58,615][39699] Initialized w:5 v:2 player:6 -[2023-09-12 21:01:58,619][39699] Initialized w:5 v:2 player:0 -[2023-09-12 21:01:58,620][39699] Initialized w:5 v:2 player:2 -[2023-09-12 21:01:58,623][39699] Initialized w:5 v:2 player:3 -[2023-09-12 21:01:58,625][39699] Initialized w:5 v:2 player:5 -[2023-09-12 21:01:58,626][39699] Initialized w:5 v:2 player:7 -[2023-09-12 21:01:58,626][39699] Initialized w:5 v:2 player:4 -[2023-09-12 21:01:58,627][39699] Initialized w:5 v:2 player:1 -[2023-09-12 21:01:58,627][39731] Initializing env for player 3, init_info: {'port': 40702}... -[2023-09-12 21:01:58,628][39699] 8 agent workers initialized for env 5! -[2023-09-12 21:01:58,641][39697] Decorrelating experience for 64 frames... -[2023-09-12 21:01:58,655][39696] Initializing env for player 6, init_info: {'port': 40502}... -[2023-09-12 21:01:58,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:01:58,678][39731] Initializing env for player 4, init_info: {'port': 40702}... -[2023-09-12 21:01:58,707][39696] Initializing env for player 7, init_info: {'port': 40502}... -[2023-09-12 21:01:58,717][39699] Decorrelating experience for 64 frames... -[2023-09-12 21:01:58,731][39731] Initializing env for player 5, init_info: {'port': 40702}... -[2023-09-12 21:01:58,795][39731] Initializing env for player 6, init_info: {'port': 40702}... -[2023-09-12 21:01:58,871][39731] Initializing env for player 7, init_info: {'port': 40702}... -[2023-09-12 21:01:59,191][39733] Port 40903 is available -[2023-09-12 21:01:59,191][39733] Using port 40903 -[2023-09-12 21:01:59,192][39733] Initializing env for player 0, init_info: {'port': 40903}... -[2023-09-12 21:01:59,221][39733] Using port 40903 on host... -[2023-09-12 21:01:59,243][39733] Initializing env for player 1, init_info: {'port': 40903}... -[2023-09-12 21:01:59,293][39733] Initializing env for player 2, init_info: {'port': 40903}... -[2023-09-12 21:01:59,302][39685] Port 40303 is available -[2023-09-12 21:01:59,302][39685] Using port 40303 -[2023-09-12 21:01:59,302][39685] Initializing env for player 0, init_info: {'port': 40303}... -[2023-09-12 21:01:59,347][39685] Using port 40303 on host... -[2023-09-12 21:01:59,347][39698] Port 40603 is available -[2023-09-12 21:01:59,348][39698] Using port 40603 -[2023-09-12 21:01:59,347][39733] Initializing env for player 3, init_info: {'port': 40903}... -[2023-09-12 21:01:59,348][39698] Initializing env for player 0, init_info: {'port': 40603}... -[2023-09-12 21:01:59,360][39685] Initializing env for player 1, init_info: {'port': 40303}... -[2023-09-12 21:01:59,392][39698] Using port 40603 on host... -[2023-09-12 21:01:59,402][39698] Initializing env for player 1, init_info: {'port': 40603}... -[2023-09-12 21:01:59,409][39733] Initializing env for player 4, init_info: {'port': 40903}... -[2023-09-12 21:01:59,419][39685] Initializing env for player 2, init_info: {'port': 40303}... -[2023-09-12 21:01:59,459][39698] Initializing env for player 2, init_info: {'port': 40603}... -[2023-09-12 21:01:59,467][39733] Initializing env for player 5, init_info: {'port': 40903}... -[2023-09-12 21:01:59,470][39685] Initializing env for player 3, init_info: {'port': 40303}... -[2023-09-12 21:01:59,517][39698] Initializing env for player 3, init_info: {'port': 40603}... -[2023-09-12 21:01:59,519][39733] Initializing env for player 6, init_info: {'port': 40903}... -[2023-09-12 21:01:59,523][39685] Initializing env for player 4, init_info: {'port': 40303}... -[2023-09-12 21:01:59,575][39685] Initializing env for player 5, init_info: {'port': 40303}... -[2023-09-12 21:01:59,575][39698] Initializing env for player 4, init_info: {'port': 40603}... -[2023-09-12 21:01:59,578][39733] Initializing env for player 7, init_info: {'port': 40903}... -[2023-09-12 21:01:59,592][39697] Port 40403 is available -[2023-09-12 21:01:59,592][39697] Using port 40403 -[2023-09-12 21:01:59,592][39697] Initializing env for player 0, init_info: {'port': 40403}... -[2023-09-12 21:01:59,623][39698] Initializing env for player 5, init_info: {'port': 40603}... -[2023-09-12 21:01:59,629][39697] Using port 40403 on host... -[2023-09-12 21:01:59,643][39697] Initializing env for player 1, init_info: {'port': 40403}... -[2023-09-12 21:01:59,664][39685] Initializing env for player 6, init_info: {'port': 40303}... -[2023-09-12 21:01:59,664][39699] Port 40803 is available -[2023-09-12 21:01:59,665][39699] Using port 40803 -[2023-09-12 21:01:59,665][39699] Initializing env for player 0, init_info: {'port': 40803}... -[2023-09-12 21:01:59,694][39697] Initializing env for player 2, init_info: {'port': 40403}... -[2023-09-12 21:01:59,695][39698] Initializing env for player 6, init_info: {'port': 40603}... -[2023-09-12 21:01:59,707][39699] Using port 40803 on host... -[2023-09-12 21:01:59,718][39699] Initializing env for player 1, init_info: {'port': 40803}... -[2023-09-12 21:01:59,719][39685] Initializing env for player 7, init_info: {'port': 40303}... -[2023-09-12 21:01:59,744][39697] Initializing env for player 3, init_info: {'port': 40403}... -[2023-09-12 21:01:59,751][39698] Initializing env for player 7, init_info: {'port': 40603}... -[2023-09-12 21:01:59,768][39699] Initializing env for player 2, init_info: {'port': 40803}... -[2023-09-12 21:01:59,795][39697] Initializing env for player 4, init_info: {'port': 40403}... -[2023-09-12 21:01:59,819][39699] Initializing env for player 3, init_info: {'port': 40803}... -[2023-09-12 21:01:59,857][39697] Initializing env for player 5, init_info: {'port': 40403}... -[2023-09-12 21:01:59,871][39699] Initializing env for player 4, init_info: {'port': 40803}... -[2023-09-12 21:01:59,887][39734] Initialized w:7 v:2 player:3 -[2023-09-12 21:01:59,888][39734] Initialized w:7 v:2 player:6 -[2023-09-12 21:01:59,889][39734] Initialized w:7 v:2 player:2 -[2023-09-12 21:01:59,890][39734] Initialized w:7 v:2 player:1 -[2023-09-12 21:01:59,890][39734] Initialized w:7 v:2 player:7 -[2023-09-12 21:01:59,891][39734] Initialized w:7 v:2 player:5 -[2023-09-12 21:01:59,891][39734] Initialized w:7 v:2 player:0 -[2023-09-12 21:01:59,892][39734] Initialized w:7 v:2 player:4 -[2023-09-12 21:01:59,893][39734] 8 agent workers initialized for env 7! -[2023-09-12 21:01:59,911][39697] Initializing env for player 6, init_info: {'port': 40403}... -[2023-09-12 21:01:59,931][39699] Initializing env for player 5, init_info: {'port': 40803}... -[2023-09-12 21:01:59,942][39734] Decorrelating experience for 64 frames... -[2023-09-12 21:01:59,967][39697] Initializing env for player 7, init_info: {'port': 40403}... -[2023-09-12 21:01:59,979][39699] Initializing env for player 6, init_info: {'port': 40803}... -[2023-09-12 21:02:00,039][39699] Initializing env for player 7, init_info: {'port': 40803}... -[2023-09-12 21:02:00,070][39696] Initialized w:2 v:2 player:2 -[2023-09-12 21:02:00,072][39696] Initialized w:2 v:2 player:6 -[2023-09-12 21:02:00,072][39696] Initialized w:2 v:2 player:7 -[2023-09-12 21:02:00,073][39696] Initialized w:2 v:2 player:1 -[2023-09-12 21:02:00,073][39696] Initialized w:2 v:2 player:5 -[2023-09-12 21:02:00,074][39696] Initialized w:2 v:2 player:0 -[2023-09-12 21:02:00,074][39696] Initialized w:2 v:2 player:3 -[2023-09-12 21:02:00,074][39696] Initialized w:2 v:2 player:4 -[2023-09-12 21:02:00,076][39696] 8 agent workers initialized for env 2! -[2023-09-12 21:02:00,122][39696] Decorrelating experience for 64 frames... -[2023-09-12 21:02:00,279][39731] Initialized w:4 v:2 player:5 -[2023-09-12 21:02:00,280][39731] Initialized w:4 v:2 player:2 -[2023-09-12 21:02:00,280][39731] Initialized w:4 v:2 player:0 -[2023-09-12 21:02:00,280][39731] Initialized w:4 v:2 player:3 -[2023-09-12 21:02:00,280][39731] Initialized w:4 v:2 player:4 -[2023-09-12 21:02:00,280][39731] Initialized w:4 v:2 player:1 -[2023-09-12 21:02:00,282][39731] Initialized w:4 v:2 player:7 -[2023-09-12 21:02:00,282][39731] Initialized w:4 v:2 player:6 -[2023-09-12 21:02:00,283][39731] 8 agent workers initialized for env 4! -[2023-09-12 21:02:00,332][39731] Decorrelating experience for 64 frames... -[2023-09-12 21:02:00,573][39734] Port 41003 is available -[2023-09-12 21:02:00,573][39734] Using port 41003 -[2023-09-12 21:02:00,573][39734] Initializing env for player 0, init_info: {'port': 41003}... -[2023-09-12 21:02:00,605][39734] Using port 41003 on host... -[2023-09-12 21:02:00,624][39734] Initializing env for player 1, init_info: {'port': 41003}... -[2023-09-12 21:02:00,674][39734] Initializing env for player 2, init_info: {'port': 41003}... -[2023-09-12 21:02:00,727][39734] Initializing env for player 3, init_info: {'port': 41003}... -[2023-09-12 21:02:00,775][39734] Initializing env for player 4, init_info: {'port': 41003}... -[2023-09-12 21:02:00,838][39696] Port 40503 is available -[2023-09-12 21:02:00,838][39696] Using port 40503 -[2023-09-12 21:02:00,838][39696] Initializing env for player 0, init_info: {'port': 40503}... -[2023-09-12 21:02:00,847][39734] Initializing env for player 5, init_info: {'port': 41003}... -[2023-09-12 21:02:00,867][39696] Using port 40503 on host... -[2023-09-12 21:02:00,889][39696] Initializing env for player 1, init_info: {'port': 40503}... -[2023-09-12 21:02:00,891][39734] Initializing env for player 6, init_info: {'port': 41003}... -[2023-09-12 21:02:00,925][39731] Port 40703 is available -[2023-09-12 21:02:00,925][39731] Using port 40703 -[2023-09-12 21:02:00,926][39731] Initializing env for player 0, init_info: {'port': 40703}... -[2023-09-12 21:02:00,943][39734] Initializing env for player 7, init_info: {'port': 41003}... -[2023-09-12 21:02:00,949][39696] Initializing env for player 2, init_info: {'port': 40503}... -[2023-09-12 21:02:00,968][39733] Initialized w:6 v:3 player:5 -[2023-09-12 21:02:00,969][39733] Initialized w:6 v:3 player:6 -[2023-09-12 21:02:00,969][39733] Initialized w:6 v:3 player:1 -[2023-09-12 21:02:00,970][39733] Initialized w:6 v:3 player:2 -[2023-09-12 21:02:00,971][39731] Using port 40703 on host... -[2023-09-12 21:02:00,970][39733] Initialized w:6 v:3 player:7 -[2023-09-12 21:02:00,971][39733] Initialized w:6 v:3 player:3 -[2023-09-12 21:02:00,971][39733] Initialized w:6 v:3 player:4 -[2023-09-12 21:02:00,972][39733] Initialized w:6 v:3 player:0 -[2023-09-12 21:02:00,973][39733] 8 agent workers initialized for env 6! -[2023-09-12 21:02:00,984][39731] Initializing env for player 1, init_info: {'port': 40703}... -[2023-09-12 21:02:00,999][39696] Initializing env for player 3, init_info: {'port': 40503}... -[2023-09-12 21:02:01,016][39733] Decorrelating experience for 96 frames... -[2023-09-12 21:02:01,031][39685] Initialized w:0 v:3 player:3 -[2023-09-12 21:02:01,033][39685] Initialized w:0 v:3 player:6 -[2023-09-12 21:02:01,034][39685] Initialized w:0 v:3 player:5 -[2023-09-12 21:02:01,034][39685] Initialized w:0 v:3 player:7 -[2023-09-12 21:02:01,035][39685] Initialized w:0 v:3 player:1 -[2023-09-12 21:02:01,035][39685] Initialized w:0 v:3 player:0 -[2023-09-12 21:02:01,039][39685] Initialized w:0 v:3 player:4 -[2023-09-12 21:02:01,042][39731] Initializing env for player 2, init_info: {'port': 40703}... -[2023-09-12 21:02:01,051][39696] Initializing env for player 4, init_info: {'port': 40503}... -[2023-09-12 21:02:01,095][39731] Initializing env for player 3, init_info: {'port': 40703}... -[2023-09-12 21:02:01,129][39696] Initializing env for player 5, init_info: {'port': 40503}... -[2023-09-12 21:02:01,153][39698] Initialized w:3 v:3 player:6 -[2023-09-12 21:02:01,157][39698] Initialized w:3 v:3 player:4 -[2023-09-12 21:02:01,159][39698] Initialized w:3 v:3 player:5 -[2023-09-12 21:02:01,159][39698] Initialized w:3 v:3 player:1 -[2023-09-12 21:02:01,159][39698] Initialized w:3 v:3 player:2 -[2023-09-12 21:02:01,159][39698] Initialized w:3 v:3 player:0 -[2023-09-12 21:02:01,159][39698] Initialized w:3 v:3 player:7 -[2023-09-12 21:02:01,160][39698] Initialized w:3 v:3 player:3 -[2023-09-12 21:02:01,162][39698] 8 agent workers initialized for env 3! -[2023-09-12 21:02:01,180][39731] Initializing env for player 4, init_info: {'port': 40703}... -[2023-09-12 21:02:01,183][39696] Initializing env for player 6, init_info: {'port': 40503}... -[2023-09-12 21:02:01,233][39731] Initializing env for player 5, init_info: {'port': 40703}... -[2023-09-12 21:02:01,236][39698] Decorrelating experience for 96 frames... -[2023-09-12 21:02:01,251][39696] Initializing env for player 7, init_info: {'port': 40503}... -[2023-09-12 21:02:01,303][39731] Initializing env for player 6, init_info: {'port': 40703}... -[2023-09-12 21:02:01,369][39731] Initializing env for player 7, init_info: {'port': 40703}... -[2023-09-12 21:02:01,413][39697] Initialized w:1 v:3 player:3 -[2023-09-12 21:02:01,415][39697] Initialized w:1 v:3 player:7 -[2023-09-12 21:02:01,417][39697] Initialized w:1 v:3 player:0 -[2023-09-12 21:02:01,417][39697] Initialized w:1 v:3 player:2 -[2023-09-12 21:02:01,418][39697] Initialized w:1 v:3 player:1 -[2023-09-12 21:02:01,420][39697] Initialized w:1 v:3 player:6 -[2023-09-12 21:02:01,421][39697] Initialized w:1 v:3 player:4 -[2023-09-12 21:02:01,422][39697] Initialized w:1 v:3 player:5 -[2023-09-12 21:02:01,423][39697] 8 agent workers initialized for env 1! -[2023-09-12 21:02:01,459][39699] Initialized w:5 v:3 player:7 -[2023-09-12 21:02:01,461][39699] Initialized w:5 v:3 player:5 -[2023-09-12 21:02:01,462][39699] Initialized w:5 v:3 player:6 -[2023-09-12 21:02:01,463][39699] Initialized w:5 v:3 player:0 -[2023-09-12 21:02:01,461][39699] Initialized w:5 v:3 player:1 -[2023-09-12 21:02:01,466][39699] Initialized w:5 v:3 player:2 -[2023-09-12 21:02:01,466][39699] Initialized w:5 v:3 player:4 -[2023-09-12 21:02:01,466][39699] Initialized w:5 v:3 player:3 -[2023-09-12 21:02:01,467][39699] 8 agent workers initialized for env 5! -[2023-09-12 21:02:01,494][39697] Decorrelating experience for 96 frames... -[2023-09-12 21:02:01,540][39699] Decorrelating experience for 96 frames... -[2023-09-12 21:02:02,032][39685] Initialized w:0 v:3 player:2 -[2023-09-12 21:02:02,033][39685] 8 agent workers initialized for env 0! -[2023-09-12 21:02:02,105][39685] Decorrelating experience for 96 frames... -[2023-09-12 21:02:02,510][39734] Initialized w:7 v:3 player:2 -[2023-09-12 21:02:02,511][39734] Initialized w:7 v:3 player:7 -[2023-09-12 21:02:02,512][39734] Initialized w:7 v:3 player:4 -[2023-09-12 21:02:02,512][39734] Initialized w:7 v:3 player:5 -[2023-09-12 21:02:02,512][39734] Initialized w:7 v:3 player:1 -[2023-09-12 21:02:02,513][39734] Initialized w:7 v:3 player:0 -[2023-09-12 21:02:02,513][39734] Initialized w:7 v:3 player:3 -[2023-09-12 21:02:02,514][39734] Initialized w:7 v:3 player:6 -[2023-09-12 21:02:02,515][39734] 8 agent workers initialized for env 7! -[2023-09-12 21:02:02,555][39734] Decorrelating experience for 96 frames... -[2023-09-12 21:02:02,559][39696] Initialized w:2 v:3 player:6 -[2023-09-12 21:02:02,560][39696] Initialized w:2 v:3 player:2 -[2023-09-12 21:02:02,560][39696] Initialized w:2 v:3 player:1 -[2023-09-12 21:02:02,560][39696] Initialized w:2 v:3 player:4 -[2023-09-12 21:02:02,560][39696] Initialized w:2 v:3 player:5 -[2023-09-12 21:02:02,561][39696] Initialized w:2 v:3 player:0 -[2023-09-12 21:02:02,561][39696] Initialized w:2 v:3 player:3 -[2023-09-12 21:02:02,561][39696] Initialized w:2 v:3 player:7 -[2023-09-12 21:02:02,563][39696] 8 agent workers initialized for env 2! -[2023-09-12 21:02:02,612][39696] Decorrelating experience for 96 frames... -[2023-09-12 21:02:02,881][39731] Initialized w:4 v:3 player:3 -[2023-09-12 21:02:02,883][39731] Initialized w:4 v:3 player:1 -[2023-09-12 21:02:02,883][39731] Initialized w:4 v:3 player:6 -[2023-09-12 21:02:02,883][39731] Initialized w:4 v:3 player:5 -[2023-09-12 21:02:02,883][39731] Initialized w:4 v:3 player:2 -[2023-09-12 21:02:02,883][39731] Initialized w:4 v:3 player:7 -[2023-09-12 21:02:02,884][39731] Initialized w:4 v:3 player:4 -[2023-09-12 21:02:02,884][39731] Initialized w:4 v:3 player:0 -[2023-09-12 21:02:02,887][39731] 8 agent workers initialized for env 4! -[2023-09-12 21:02:02,948][39731] Decorrelating experience for 96 frames... -[2023-09-12 21:02:03,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 0. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:02:05,178][39537] Signal inference workers to stop experience collection... -[2023-09-12 21:02:05,203][39686] InferenceWorker_p0-w0: stopping experience collection -[2023-09-12 21:02:06,207][39537] EvtLoop [learner_proc0_evt_loop, process=learner_proc0] unhandled exception in slot='on_new_training_batch' connected to emitter=Emitter(object_id='Batcher_0', signal_name='training_batches_available'), args=(0,) -Traceback (most recent call last): - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/signal_slot/signal_slot.py", line 355, in _process_signal - slot_callable(*args) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner_worker.py", line 150, in on_new_training_batch - stats = self.learner.train(self.batcher.training_batches[batch_idx]) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 1046, in train - train_stats = self._train(buff, self.cfg.batch_size, experience_size, num_invalids) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 731, in _train - ) = self._calculate_losses(mb, num_invalids) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 649, in _calculate_losses - exploration_loss = self.exploration_loss_func(action_distribution, valids, num_invalids) - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/learning/learner.py", line 477, in _symmetric_kl_exploration_loss - kl_prior = action_distribution.symmetric_kl_with_uniform_prior() - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py", line 247, in symmetric_kl_with_uniform_prior - sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions] - File "/home/cogstack/.local/share/virtualenvs/sample_factory--NQNquiM/lib/python3.10/site-packages/sample_factory/algo/utils/action_distributions.py", line 247, in - sym_kls = [d.symmetric_kl_with_uniform_prior().unsqueeze(dim=1) for d in self.distributions] -AttributeError: 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior' -[2023-09-12 21:02:06,208][39537] Unhandled exception 'ContinuousActionDistribution' object has no attribute 'symmetric_kl_with_uniform_prior' in evt loop learner_proc0_evt_loop -[2023-09-12 21:02:06,931][28625] Heartbeat connected on Batcher_0 -[2023-09-12 21:02:06,938][28625] Heartbeat connected on InferenceWorker_p0-w0 -[2023-09-12 21:02:06,944][28625] Heartbeat connected on RolloutWorker_w0 -[2023-09-12 21:02:06,949][28625] Heartbeat connected on RolloutWorker_w1 -[2023-09-12 21:02:06,953][28625] Heartbeat connected on RolloutWorker_w2 -[2023-09-12 21:02:06,957][28625] Heartbeat connected on RolloutWorker_w3 -[2023-09-12 21:02:06,961][28625] Heartbeat connected on RolloutWorker_w4 -[2023-09-12 21:02:06,965][28625] Heartbeat connected on RolloutWorker_w5 -[2023-09-12 21:02:06,968][28625] Heartbeat connected on RolloutWorker_w6 -[2023-09-12 21:02:06,973][28625] Heartbeat connected on RolloutWorker_w7 -[2023-09-12 21:02:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 483.2. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:02:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 362.4. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:02:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 289.9. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:02:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 241.6. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:02:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 207.1. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:02:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 181.2. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:02:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 161.1. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:02:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 161.1. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:02:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 161.1. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:02:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:02:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:03:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:03:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:03:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:03:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:03:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:03:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:03:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:03:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:03:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:03:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:03:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:03:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:04:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:04:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:04:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:04:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:04:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:04:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:04:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:04:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:04:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:04:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:04:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:04:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:05:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:05:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:05:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:05:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:05:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:05:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:05:33,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:05:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:05:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:05:48,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:05:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:05:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:06:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:06:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:06:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:06:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:06:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:06:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:06:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:06:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:06:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:06:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:06:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:06:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:07:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:07:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:07:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:07:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:07:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:07:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:07:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:07:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:07:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:07:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:07:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:07:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:08:03,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:08:08,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:08:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:08:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:08:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:08:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:08:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:08:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:08:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:08:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:08:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:08:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:09:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:09:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:09:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:09:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:09:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:09:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:09:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:09:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:09:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:09:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:09:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:09:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:10:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:10:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:10:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:10:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:10:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:10:28,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:10:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:10:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:10:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:10:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:10:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:10:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:11:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:11:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:11:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:11:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:11:23,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:11:28,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:11:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:11:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:11:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:11:43,670][28625] Components not started: LearnerWorker_p0, wait_time=600.0 seconds -[2023-09-12 21:11:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:11:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:11:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:12:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:12:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:12:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:12:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:12:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:12:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:12:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:12:38,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:12:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:12:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:12:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:12:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:13:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:13:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:13:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:13:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:13:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:13:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:13:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:13:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:13:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:13:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:13:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:13:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:14:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:14:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:14:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:14:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:14:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:14:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:14:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:14:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:14:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:14:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:14:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:14:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:15:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:15:08,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:15:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:15:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:15:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:15:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:15:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:15:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:15:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:15:48,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:15:53,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:15:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:16:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:16:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:16:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:16:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:16:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:16:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:16:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:16:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:16:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:16:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:16:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:16:58,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:17:03,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:17:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:17:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:17:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:17:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:17:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:17:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:17:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:17:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:17:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:17:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:17:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:18:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:18:08,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:18:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:18:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:18:23,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:18:28,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:18:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:18:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:18:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:18:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:18:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:18:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:19:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:19:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:19:13,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:19:18,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:19:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:19:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:19:33,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:19:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:19:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:19:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:19:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:19:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:20:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:20:08,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:20:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:20:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:20:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:20:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:20:33,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:20:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:20:43,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:20:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:20:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:20:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:21:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:21:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:21:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:21:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:21:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:21:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:21:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:21:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:21:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:21:43,670][28625] Components not started: LearnerWorker_p0, wait_time=1200.0 seconds -[2023-09-12 21:21:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:21:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:21:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:22:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:22:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:22:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:22:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:22:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:22:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:22:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:22:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:22:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:22:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:22:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:22:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:23:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:23:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:23:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:23:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:23:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:23:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:23:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:23:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:23:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:23:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:23:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:23:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:24:03,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:24:08,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:24:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:24:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:24:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:24:28,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:24:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:24:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:24:43,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:24:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:24:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:24:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:25:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:25:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:25:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:25:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:25:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:25:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:25:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:25:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:25:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:25:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:25:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:25:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:26:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:26:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:26:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:26:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:26:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:26:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:26:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:26:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:26:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:26:48,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:26:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:26:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:27:03,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:27:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:27:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:27:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:27:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:27:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:27:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:27:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:27:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:27:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:27:53,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:27:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:28:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:28:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:28:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:28:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:28:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:28:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:28:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:28:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:28:43,664][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:28:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:28:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:28:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:29:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:29:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:29:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:29:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:29:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:29:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:29:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:29:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:29:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:29:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:29:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:29:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:30:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:30:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:30:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:30:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:30:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:30:28,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:30:33,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:30:38,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:30:43,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:30:48,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:30:53,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:30:58,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:31:03,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:31:08,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:31:13,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:31:18,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:31:23,665][28625] Fps is (10 sec: 0.0, 60 sec: 0.0, 300 sec: 0.0). Total num frames: 0. Throughput: 0: 0.0. Samples: 7248. Policy #0 lag: (min: -1.0, avg: -1.0, max: -1.0) -[2023-09-12 21:31:27,821][28625] Keyboard interrupt detected in the event loop EvtLoop [Runner_EvtLoop, process=main process 28625], exiting... -[2023-09-12 21:31:27,824][39537] Stopping Batcher_0... -[2023-09-12 21:31:27,823][28625] Runner profile tree view: -main_loop: 1780.8502 -[2023-09-12 21:31:27,825][39537] Loop batcher_evt_loop terminating... -[2023-09-12 21:31:27,825][28625] Collected {0: 0}, FPS: 0.0 -[2023-09-12 21:31:27,841][39686] Weights refcount: 2 0 -[2023-09-12 21:31:27,842][39686] Stopping InferenceWorker_p0-w0... -[2023-09-12 21:31:27,842][39686] Loop inference_proc0-0_evt_loop terminating... -[2023-09-12 21:31:27,858][28625] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json -[2023-09-12 21:31:27,861][28625] Overriding arg 'num_workers' with value 1 passed from command line -[2023-09-12 21:31:27,866][28625] Adding new argument 'no_render'=True that is not in the saved config file! -[2023-09-12 21:31:27,872][28625] Adding new argument 'save_video'=True that is not in the saved config file! -[2023-09-12 21:31:27,878][28625] Adding new argument 'video_frames'=1000000000.0 that is not in the saved config file! -[2023-09-12 21:31:27,881][28625] Adding new argument 'video_name'=None that is not in the saved config file! -[2023-09-12 21:31:27,882][28625] Adding new argument 'max_num_frames'=100000 that is not in the saved config file! -[2023-09-12 21:31:27,882][28625] Adding new argument 'max_num_episodes'=10 that is not in the saved config file! -[2023-09-12 21:31:27,883][28625] Adding new argument 'push_to_hub'=True that is not in the saved config file! -[2023-09-12 21:31:27,884][28625] Adding new argument 'hf_repository'='MattStammers/vizdoom_fight' that is not in the saved config file! -[2023-09-12 21:31:27,885][28625] Adding new argument 'policy_index'=0 that is not in the saved config file! -[2023-09-12 21:31:27,886][28625] Adding new argument 'eval_deterministic'=False that is not in the saved config file! -[2023-09-12 21:31:27,886][28625] Adding new argument 'train_script'=None that is not in the saved config file! -[2023-09-12 21:31:27,887][28625] Adding new argument 'enjoy_script'=None that is not in the saved config file! -[2023-09-12 21:31:27,888][28625] Using frameskip 1 and render_action_repeat=4 for evaluation -[2023-09-12 21:31:27,888][28625] Multi agent env, num agents: 8 -[2023-09-12 21:31:27,915][28625] RunningMeanStd input shape: (23,) -[2023-09-12 21:31:27,917][28625] RunningMeanStd input shape: (3, 72, 128) -[2023-09-12 21:31:27,918][28625] RunningMeanStd input shape: (1,) -[2023-09-12 21:31:27,930][28625] ConvEncoder: input_channels=3 -[2023-09-12 21:31:27,999][28625] Conv encoder output size: 512 -[2023-09-12 21:31:28,001][28625] Policy head output size: 640 -[2023-09-12 21:31:28,058][28625] No checkpoints found -[2023-09-12 21:31:30,420][28625] Loading existing experiment configuration from /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/config.json -[2023-09-12 21:31:30,421][28625] Overriding arg 'num_workers' with value 1 passed from command line -[2023-09-12 21:31:30,423][28625] Adding new argument 'no_render'=True that is not in the saved config file! -[2023-09-12 21:31:30,424][28625] Adding new argument 'save_video'=True that is not in the saved config file! -[2023-09-12 21:31:30,426][28625] Adding new argument 'video_frames'=1000000000.0 that is not in the saved config file! -[2023-09-12 21:31:30,427][28625] Adding new argument 'video_name'=None that is not in the saved config file! -[2023-09-12 21:31:30,429][28625] Adding new argument 'max_num_frames'=100000 that is not in the saved config file! -[2023-09-12 21:31:30,430][28625] Adding new argument 'max_num_episodes'=10 that is not in the saved config file! -[2023-09-12 21:31:30,431][28625] Adding new argument 'push_to_hub'=True that is not in the saved config file! -[2023-09-12 21:31:30,434][28625] Adding new argument 'hf_repository'='MattStammers/vizdoom_fight' that is not in the saved config file! -[2023-09-12 21:31:30,436][28625] Adding new argument 'policy_index'=0 that is not in the saved config file! -[2023-09-12 21:31:30,436][28625] Adding new argument 'eval_deterministic'=False that is not in the saved config file! -[2023-09-12 21:31:30,437][28625] Adding new argument 'train_script'=None that is not in the saved config file! -[2023-09-12 21:31:30,438][28625] Adding new argument 'enjoy_script'=None that is not in the saved config file! -[2023-09-12 21:31:30,439][28625] Using frameskip 1 and render_action_repeat=4 for evaluation -[2023-09-12 21:31:30,440][28625] Multi agent env, num agents: 8 -[2023-09-12 21:31:30,467][28625] RunningMeanStd input shape: (23,) -[2023-09-12 21:31:30,469][28625] RunningMeanStd input shape: (3, 72, 128) -[2023-09-12 21:31:30,469][28625] RunningMeanStd input shape: (1,) -[2023-09-12 21:31:30,479][28625] ConvEncoder: input_channels=3 -[2023-09-12 21:31:30,517][28625] Conv encoder output size: 512 -[2023-09-12 21:31:30,520][28625] Policy head output size: 640 -[2023-09-12 21:31:30,549][28625] No checkpoints found -[2023-09-12 21:31:31,039][39699] Stopping RolloutWorker_w5... -[2023-09-12 21:31:31,040][39699] Loop rollout_proc5_evt_loop terminating... -[2023-09-12 21:31:31,041][39697] Stopping RolloutWorker_w1... -[2023-09-12 21:31:31,042][39731] Stopping RolloutWorker_w4... -[2023-09-12 21:31:31,042][39697] Loop rollout_proc1_evt_loop terminating... -[2023-09-12 21:31:31,042][39731] Loop rollout_proc4_evt_loop terminating... -[2023-09-12 21:31:31,045][39734] Stopping RolloutWorker_w7... -[2023-09-12 21:31:31,045][39734] Loop rollout_proc7_evt_loop terminating... -[2023-09-12 21:31:31,050][39685] Stopping RolloutWorker_w0... -[2023-09-12 21:31:31,050][39685] Loop rollout_proc0_evt_loop terminating... -[2023-09-12 21:31:31,114][39733] Stopping RolloutWorker_w6... -[2023-09-12 21:31:31,115][39733] Loop rollout_proc6_evt_loop terminating... -[2023-09-12 21:31:31,121][39698] Stopping RolloutWorker_w3... -[2023-09-12 21:31:31,121][39698] Loop rollout_proc3_evt_loop terminating... -[2023-09-12 21:31:31,150][39696] Stopping RolloutWorker_w2... -[2023-09-12 21:31:31,151][39696] Loop rollout_proc2_evt_loop terminating... +[2023-09-14 14:36:34,638][63576] Using optimizer +[2023-09-14 14:36:34,639][63576] No checkpoints found +[2023-09-14 14:36:34,639][63576] Did not load from checkpoint, starting from scratch! +[2023-09-14 14:36:34,639][63576] Initialized policy 1 weights for model version 0 +[2023-09-14 14:36:34,641][63576] LearnerWorker_p1 finished initialization! +[2023-09-14 14:36:34,641][63576] Using GPUs [0] for process 1 (actually maps to GPUs [1]) +[2023-09-14 14:36:34,966][63732] Using GPUs [0] for process 0 (actually maps to GPUs [0]) +[2023-09-14 14:36:34,966][63732] Set environment var CUDA_VISIBLE_DEVICES to '0' (GPU indices [0]) for inference process 0 +[2023-09-14 14:36:34,984][63732] Num visible devices: 1 +[2023-09-14 14:36:35,027][63734] Worker 1 uses CPU cores [4, 5, 6, 7] +[2023-09-14 14:36:35,040][63806] Worker 7 uses CPU cores [28, 29, 30, 31] +[2023-09-14 14:36:35,099][63770] Worker 4 uses CPU cores [16, 17, 18, 19] +[2023-09-14 14:36:35,180][63769] Worker 3 uses CPU cores [12, 13, 14, 15] +[2023-09-14 14:36:35,289][63771] Worker 5 uses CPU cores [20, 21, 22, 23] +[2023-09-14 14:36:35,305][63767] Worker 2 uses CPU cores [8, 9, 10, 11] +[2023-09-14 14:36:35,343][63733] Using GPUs [1] for process 1 (actually maps to GPUs [1]) +[2023-09-14 14:36:35,343][63733] Set environment var CUDA_VISIBLE_DEVICES to '1' (GPU indices [1]) for inference process 1 +[2023-09-14 14:36:35,362][63733] Num visible devices: 1 +[2023-09-14 14:36:35,504][63805] Worker 6 uses CPU cores [24, 25, 26, 27] +[2023-09-14 14:36:35,539][63735] Worker 0 uses CPU cores [0, 1, 2, 3] +[2023-09-14 14:36:35,629][63732] RunningMeanStd input shape: (23,) +[2023-09-14 14:36:35,629][63732] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 14:36:35,630][63732] RunningMeanStd input shape: (1,) +[2023-09-14 14:36:35,642][63732] ConvEncoder: input_channels=3 +[2023-09-14 14:36:35,747][63732] Conv encoder output size: 512 +[2023-09-14 14:36:35,748][63732] Policy head output size: 640 +[2023-09-14 14:36:36,012][63733] RunningMeanStd input shape: (23,) +[2023-09-14 14:36:36,012][63733] RunningMeanStd input shape: (3, 72, 128) +[2023-09-14 14:36:36,013][63733] RunningMeanStd input shape: (1,) +[2023-09-14 14:36:36,024][63733] ConvEncoder: input_channels=3 +[2023-09-14 14:36:36,126][63733] Conv encoder output size: 512 +[2023-09-14 14:36:36,127][63733] Policy head output size: 640 +[2023-09-14 14:36:36,442][63735] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 14:36:36,444][63735] Port 40300 is available +[2023-09-14 14:36:36,444][63735] Using port 40300 +[2023-09-14 14:36:36,446][63734] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 14:36:36,447][63806] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 14:36:36,447][63769] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 14:36:36,447][63767] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 14:36:36,448][63805] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 14:36:36,448][63734] Port 40400 is available +[2023-09-14 14:36:36,449][63734] Using port 40400 +[2023-09-14 14:36:36,449][63806] UDP port 41000 cannot be used [Errno 98] Address already in use +[2023-09-14 14:36:36,449][63769] Port 40600 is available +[2023-09-14 14:36:36,449][63769] Using port 40600 +[2023-09-14 14:36:36,449][63806] Port 42000 is available +[2023-09-14 14:36:36,449][63806] Using port 42000 +[2023-09-14 14:36:36,449][63767] Port 40500 is available +[2023-09-14 14:36:36,450][63767] Using port 40500 +[2023-09-14 14:36:36,451][63805] Port 40900 is available +[2023-09-14 14:36:36,451][63805] Using port 40900 +[2023-09-14 14:36:36,452][63770] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 14:36:36,455][63770] Port 40700 is available +[2023-09-14 14:36:36,456][63770] Using port 40700 +[2023-09-14 14:36:36,456][63771] Doom resolution: 160x120, resize resolution: (128, 72) +[2023-09-14 14:36:36,459][63771] Port 40800 is available +[2023-09-14 14:36:36,460][63771] Using port 40800 +[2023-09-14 14:36:36,474][63735] Port 40301 is available +[2023-09-14 14:36:36,474][63735] Using port 40301 +[2023-09-14 14:36:36,476][63735] Using port 40300 on host... +[2023-09-14 14:36:36,479][63734] Port 40401 is available +[2023-09-14 14:36:36,479][63806] UDP port 41001 cannot be used [Errno 98] Address already in use +[2023-09-14 14:36:36,479][63734] Using port 40401 +[2023-09-14 14:36:36,479][63806] Port 42001 is available +[2023-09-14 14:36:36,479][63806] Using port 42001 +[2023-09-14 14:36:36,480][63769] Port 40601 is available +[2023-09-14 14:36:36,480][63769] Using port 40601 +[2023-09-14 14:36:36,480][63734] Using port 40400 on host... +[2023-09-14 14:36:36,481][63767] Port 40501 is available +[2023-09-14 14:36:36,481][63806] Using port 42000 on host... +[2023-09-14 14:36:36,481][63767] Using port 40501 +[2023-09-14 14:36:36,482][63769] Using port 40600 on host... +[2023-09-14 14:36:36,482][63805] Port 40901 is available +[2023-09-14 14:36:36,482][63805] Using port 40901 +[2023-09-14 14:36:36,482][63767] Using port 40500 on host... +[2023-09-14 14:36:36,484][63805] Using port 40900 on host... +[2023-09-14 14:36:36,486][63770] Port 40701 is available +[2023-09-14 14:36:36,486][63770] Using port 40701 +[2023-09-14 14:36:36,488][63770] Using port 40700 on host... +[2023-09-14 14:36:36,506][63771] Port 40801 is available +[2023-09-14 14:36:36,507][63771] Using port 40801 +[2023-09-14 14:36:36,509][63771] Using port 40800 on host... +[2023-09-14 14:36:36,770][63806] Initialized w:7 v:0 player:0 +[2023-09-14 14:36:36,772][63806] Decorrelating experience for 0 frames... +[2023-09-14 14:36:36,773][63806] Using port 42001 on host... +[2023-09-14 14:36:36,778][63805] Initialized w:6 v:0 player:0 +[2023-09-14 14:36:36,778][63769] Initialized w:3 v:0 player:0 +[2023-09-14 14:36:36,779][63767] Initialized w:2 v:0 player:0 +[2023-09-14 14:36:36,780][63805] Decorrelating experience for 0 frames... +[2023-09-14 14:36:36,780][63769] Decorrelating experience for 0 frames... +[2023-09-14 14:36:36,781][63767] Decorrelating experience for 0 frames... +[2023-09-14 14:36:36,782][63805] Using port 40901 on host... +[2023-09-14 14:36:36,782][63769] Using port 40601 on host... +[2023-09-14 14:36:36,783][63767] Using port 40501 on host... +[2023-09-14 14:36:36,794][63771] Initialized w:5 v:0 player:0 +[2023-09-14 14:36:36,796][63771] Decorrelating experience for 0 frames... +[2023-09-14 14:36:36,797][63771] Using port 40801 on host... +[2023-09-14 14:36:36,840][63735] Initialized w:0 v:0 player:0 +[2023-09-14 14:36:36,842][63735] Decorrelating experience for 0 frames... +[2023-09-14 14:36:36,843][63735] Using port 40301 on host... +[2023-09-14 14:36:36,845][63734] Initialized w:1 v:0 player:0 +[2023-09-14 14:36:36,847][63734] Decorrelating experience for 0 frames... +[2023-09-14 14:36:36,848][63734] Using port 40401 on host... +[2023-09-14 14:36:36,852][63770] Initialized w:4 v:0 player:0 +[2023-09-14 14:36:36,854][63770] Decorrelating experience for 0 frames... +[2023-09-14 14:36:36,855][63770] Using port 40701 on host... +[2023-09-14 14:36:37,065][63767] Initialized w:2 v:1 player:0 +[2023-09-14 14:36:37,065][63769] Initialized w:3 v:1 player:0 +[2023-09-14 14:36:37,066][63767] Decorrelating experience for 32 frames... +[2023-09-14 14:36:37,067][63769] Decorrelating experience for 32 frames... +[2023-09-14 14:36:37,069][63805] Initialized w:6 v:1 player:0 +[2023-09-14 14:36:37,070][63805] Decorrelating experience for 32 frames... +[2023-09-14 14:36:37,094][63771] Initialized w:5 v:1 player:0 +[2023-09-14 14:36:37,095][63771] Decorrelating experience for 32 frames... +[2023-09-14 14:36:37,095][63806] Initialized w:7 v:1 player:0 +[2023-09-14 14:36:37,097][63806] Decorrelating experience for 32 frames... +[2023-09-14 14:36:37,151][63767] Port 40502 is available +[2023-09-14 14:36:37,151][63767] Using port 40502 +[2023-09-14 14:36:37,162][63805] Port 40902 is available +[2023-09-14 14:36:37,162][63805] Using port 40902 +[2023-09-14 14:36:37,176][63769] Port 40602 is available +[2023-09-14 14:36:37,176][63769] Using port 40602 +[2023-09-14 14:36:37,181][63767] Port 40503 is available +[2023-09-14 14:36:37,181][63767] Using port 40503 +[2023-09-14 14:36:37,183][63767] Using port 40502 on host... +[2023-09-14 14:36:37,183][63771] Port 40802 is available +[2023-09-14 14:36:37,183][63771] Using port 40802 +[2023-09-14 14:36:37,190][63805] Port 40903 is available +[2023-09-14 14:36:37,191][63805] Using port 40903 +[2023-09-14 14:36:37,192][63805] Using port 40902 on host... +[2023-09-14 14:36:37,201][63806] UDP port 41002 cannot be used [Errno 98] Address already in use +[2023-09-14 14:36:37,201][63806] Port 42002 is available +[2023-09-14 14:36:37,201][63806] Using port 42002 +[2023-09-14 14:36:37,212][63771] Port 40803 is available +[2023-09-14 14:36:37,213][63771] Using port 40803 +[2023-09-14 14:36:37,214][63771] Using port 40802 on host... +[2023-09-14 14:36:37,221][63769] Port 40603 is available +[2023-09-14 14:36:37,221][63769] Using port 40603 +[2023-09-14 14:36:37,224][63769] Using port 40602 on host... +[2023-09-14 14:36:37,239][63735] Initialized w:0 v:1 player:0 +[2023-09-14 14:36:37,241][63735] Decorrelating experience for 32 frames... +[2023-09-14 14:36:37,246][63734] Initialized w:1 v:1 player:0 +[2023-09-14 14:36:37,247][63806] Port 41003 is available +[2023-09-14 14:36:37,247][63806] Using port 41003 +[2023-09-14 14:36:37,246][63770] Initialized w:4 v:1 player:0 +[2023-09-14 14:36:37,247][63734] Decorrelating experience for 32 frames... +[2023-09-14 14:36:37,249][63806] Using port 42002 on host... +[2023-09-14 14:36:37,249][63770] Decorrelating experience for 32 frames... +[2023-09-14 14:36:37,331][63735] Port 40302 is available +[2023-09-14 14:36:37,331][63735] Using port 40302 +[2023-09-14 14:36:37,343][63770] Port 40702 is available +[2023-09-14 14:36:37,344][63770] Using port 40702 +[2023-09-14 14:36:37,356][63734] Port 40402 is available +[2023-09-14 14:36:37,357][63734] Using port 40402 +[2023-09-14 14:36:37,360][63735] Port 40303 is available +[2023-09-14 14:36:37,360][63735] Using port 40303 +[2023-09-14 14:36:37,362][63735] Using port 40302 on host... +[2023-09-14 14:36:37,376][63770] Port 40703 is available +[2023-09-14 14:36:37,376][63770] Using port 40703 +[2023-09-14 14:36:37,378][63770] Using port 40702 on host... +[2023-09-14 14:36:37,402][63734] Port 40403 is available +[2023-09-14 14:36:37,402][63734] Using port 40403 +[2023-09-14 14:36:37,404][63734] Using port 40402 on host... +[2023-09-14 14:36:37,479][63805] Initialized w:6 v:2 player:0 +[2023-09-14 14:36:37,480][63805] Decorrelating experience for 64 frames... +[2023-09-14 14:36:37,525][63767] Initialized w:2 v:2 player:0 +[2023-09-14 14:36:37,526][63767] Decorrelating experience for 64 frames... +[2023-09-14 14:36:37,559][63769] Initialized w:3 v:2 player:0 +[2023-09-14 14:36:37,561][63769] Decorrelating experience for 64 frames... +[2023-09-14 14:36:37,594][63805] Using port 40903 on host... +[2023-09-14 14:36:37,625][63767] Using port 40503 on host... +[2023-09-14 14:36:37,669][63806] Initialized w:7 v:2 player:0 +[2023-09-14 14:36:37,670][63806] Decorrelating experience for 64 frames... +[2023-09-14 14:36:37,687][63769] Using port 40603 on host... +[2023-09-14 14:36:37,692][63771] Initialized w:5 v:2 player:0 +[2023-09-14 14:36:37,694][63771] Decorrelating experience for 64 frames... +[2023-09-14 14:36:37,732][63735] Initialized w:0 v:2 player:0 +[2023-09-14 14:36:37,733][63735] Decorrelating experience for 64 frames... +[2023-09-14 14:36:37,784][63806] Using port 41003 on host... +[2023-09-14 14:36:37,804][63771] Using port 40803 on host... +[2023-09-14 14:36:37,828][63770] Initialized w:4 v:2 player:0 +[2023-09-14 14:36:37,830][63770] Decorrelating experience for 64 frames... +[2023-09-14 14:36:37,844][63735] Using port 40303 on host... +[2023-09-14 14:36:37,862][63734] Initialized w:1 v:2 player:0 +[2023-09-14 14:36:37,865][63734] Decorrelating experience for 64 frames... +[2023-09-14 14:36:37,895][63805] Initialized w:6 v:3 player:0 +[2023-09-14 14:36:37,897][63805] Decorrelating experience for 96 frames... +[2023-09-14 14:36:37,899][63767] Initialized w:2 v:3 player:0 +[2023-09-14 14:36:37,900][63767] Decorrelating experience for 96 frames... +[2023-09-14 14:36:37,934][63770] Using port 40703 on host... +[2023-09-14 14:36:37,974][63769] Initialized w:3 v:3 player:0 +[2023-09-14 14:36:37,976][63769] Decorrelating experience for 96 frames... +[2023-09-14 14:36:37,994][63734] Using port 40403 on host... +[2023-09-14 14:36:38,077][63806] Initialized w:7 v:3 player:0 +[2023-09-14 14:36:38,079][63806] Decorrelating experience for 96 frames... +[2023-09-14 14:36:38,101][63771] Initialized w:5 v:3 player:0 +[2023-09-14 14:36:38,103][63771] Decorrelating experience for 96 frames... +[2023-09-14 14:36:38,132][63735] Initialized w:0 v:3 player:0 +[2023-09-14 14:36:38,134][63735] Decorrelating experience for 96 frames... +[2023-09-14 14:36:38,269][63770] Initialized w:4 v:3 player:0 +[2023-09-14 14:36:38,271][63770] Decorrelating experience for 96 frames... +[2023-09-14 14:36:38,386][63734] Initialized w:1 v:3 player:0 +[2023-09-14 14:36:38,387][63734] Decorrelating experience for 96 frames... +[2023-09-14 14:36:39,962][63454] Signal inference workers to stop experience collection... +[2023-09-14 14:36:39,965][63733] InferenceWorker_p1-w0: stopping experience collection +[2023-09-14 14:36:39,969][63732] InferenceWorker_p0-w0: stopping experience collection +[2023-09-14 14:36:42,857][63454] Signal inference workers to resume experience collection... +[2023-09-14 14:36:42,858][63732] InferenceWorker_p0-w0: resuming experience collection +[2023-09-14 14:36:42,858][63733] InferenceWorker_p1-w0: resuming experience collection +[2023-09-14 14:36:45,350][63576] Signal inference workers to stop experience collection... +[2023-09-14 14:36:45,687][63576] Signal inference workers to resume experience collection... +[2023-09-14 14:36:48,781][63732] Updated weights for policy 0, policy_version 10 (0.0700) +[2023-09-14 14:36:52,631][63733] Updated weights for policy 1, policy_version 10 (0.0012) +[2023-09-14 14:36:54,671][63732] Updated weights for policy 0, policy_version 20 (0.0012) +[2023-09-14 14:37:00,489][63732] Updated weights for policy 0, policy_version 30 (0.0013) +[2023-09-14 14:37:02,288][63733] Updated weights for policy 1, policy_version 20 (0.0011) +[2023-09-14 14:37:03,460][63734] DAMAGECOUNT value on done: 10.0 +[2023-09-14 14:37:03,598][63734] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 14:37:03,754][63770] DAMAGECOUNT value on done: 15.0 +[2023-09-14 14:37:03,755][63770] Sum rewards: -8.078, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.156', 'AMMO5': '0.005', 'AMMO2': '0.011', 'weapon4': '0.014', 'HITCOUNT': '0.020', 'weapon5': '0.026', 'DAMAGECOUNT': '0.045', 'ARMOR': '0.048', 'AMMO4': '0.054', 'AMMO3': '0.096', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'WEAPON3': '0.500', 'weapon3': '0.534', 'FRAGCOUNT': '1.000', 'weapon2': '1.026'} +[2023-09-14 14:37:03,781][63734] DAMAGECOUNT value on done: 46.0 +[2023-09-14 14:37:04,094][63770] DAMAGECOUNT value on done: 20.0 +[2023-09-14 14:37:04,095][63770] Sum rewards: -5.467, reward structure: {'DEATHCOUNT': '-6.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.318', 'AMMO5': '0.003', 'AMMO2': '0.003', 'AMMO4': '0.015', 'HITCOUNT': '0.020', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'DAMAGECOUNT': '0.060', 'AMMO3': '0.067', 'WEAPON5': '0.100', 'weapon5': '0.106', 'ARMOR': '0.116', 'weapon4': '0.124', 'WEAPON3': '0.350', 'weapon3': '0.498', 'weapon2': '0.818'} +[2023-09-14 14:37:04,866][63805] DAMAGECOUNT value on done: 35.0 +[2023-09-14 14:37:05,004][63805] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 14:37:05,121][63806] DAMAGECOUNT value on done: 25.0 +[2023-09-14 14:37:05,140][63735] DAMAGECOUNT value on done: 15.0 +[2023-09-14 14:37:05,256][63806] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 14:37:05,257][63805] DAMAGECOUNT value on done: 15.0 +[2023-09-14 14:37:05,281][63735] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 14:37:05,424][63771] DAMAGECOUNT value on done: 35.0 +[2023-09-14 14:37:05,425][63771] Sum rewards: -5.664, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.012', 'AMMO2': '0.000', 'AMMO4': '0.000', 'HITCOUNT': '0.040', 'DAMAGECOUNT': '0.105', 'AMMO3': '0.106', 'WEAPON3': '0.450', 'weapon2': '0.812', 'weapon3': '0.834', 'FRAGCOUNT': '1.000'} +[2023-09-14 14:37:05,523][63806] DAMAGECOUNT value on done: 218.0 +[2023-09-14 14:37:05,523][63806] Sum rewards: -4.069, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.198', 'AMMO2': '0.002', 'AMMO5': '0.003', 'AMMO4': '0.011', 'weapon5': '0.038', 'WEAPON5': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.133', 'DAMAGECOUNT': '0.654', 'WEAPON3': '0.700', 'weapon2': '0.784', 'weapon3': '0.944', 'FRAGCOUNT': '1.000'} +[2023-09-14 14:37:05,574][63771] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 14:37:05,589][63735] DAMAGECOUNT value on done: 15.0 +[2023-09-14 14:37:05,605][63805] DAMAGECOUNT value on done: 150.0 +[2023-09-14 14:37:05,606][63805] Sum rewards: -3.372, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.595', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO4': '0.026', 'ARMOR': '0.028', 'weapon4': '0.074', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.103', 'HITCOUNT': '0.150', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.600', 'weapon3': '0.786', 'weapon2': '0.796', 'FRAGCOUNT': '1.000'} +[2023-09-14 14:37:05,837][63771] DAMAGECOUNT value on done: 5.0 +[2023-09-14 14:37:06,006][63805] DAMAGECOUNT value on done: 40.0 +[2023-09-14 14:37:06,039][63734] DAMAGECOUNT value on done: 15.0 +[2023-09-14 14:37:06,355][63734] DAMAGECOUNT value on done: 7.0 +[2023-09-14 14:37:06,377][63767] DAMAGECOUNT value on done: 85.0 +[2023-09-14 14:37:06,500][63767] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 14:37:06,623][63732] Updated weights for policy 0, policy_version 40 (0.0014) +[2023-09-14 14:37:06,703][63769] DAMAGECOUNT value on done: 173.0 +[2023-09-14 14:37:06,744][63767] DAMAGECOUNT value on done: 65.0 +[2023-09-14 14:37:06,745][63767] Sum rewards: -2.545, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.475', 'AMMO2': '0.006', 'AMMO4': '0.028', 'WEAPON4': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.107', 'ARMOR': '0.116', 'weapon4': '0.168', 'DAMAGECOUNT': '0.195', 'WEAPON3': '0.500', 'weapon3': '0.786', 'weapon2': '0.914', 'FRAGCOUNT': '1.000'} +[2023-09-14 14:37:06,887][63806] DAMAGECOUNT value on done: 175.0 +[2023-09-14 14:37:06,888][63806] Sum rewards: -7.130, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.074', 'AMMO5': '0.003', 'AMMO2': '0.005', 'weapon5': '0.010', 'AMMO4': '0.023', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'weapon4': '0.064', 'HITCOUNT': '0.110', 'AMMO3': '0.186', 'DAMAGECOUNT': '0.525', 'weapon2': '0.600', 'weapon3': '0.628', 'WEAPON3': '0.900', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:37:07,035][63769] DAMAGECOUNT value on done: 25.0 +[2023-09-14 14:37:07,105][63767] DAMAGECOUNT value on done: 10.0 +[2023-09-14 14:37:07,134][63735] DAMAGECOUNT value on done: 50.0 +[2023-09-14 14:37:07,135][63735] Sum rewards: -6.700, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.710', 'AMMO4': '-0.013', 'AMMO2': '-0.003', 'HITCOUNT': '0.050', 'ARMOR': '0.060', 'DAMAGECOUNT': '0.150', 'AMMO3': '0.167', 'weapon3': '0.678', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.070'} +[2023-09-14 14:37:07,331][63806] DAMAGECOUNT value on done: 17.0 +[2023-09-14 14:37:07,332][63806] Sum rewards: -9.517, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.022', 'AMMO2': '0.003', 'WEAPON1': '0.010', 'AMMO4': '0.016', 'HITCOUNT': '0.020', 'ARMOR': '0.028', 'WEAPON4': '0.050', 'DAMAGECOUNT': '0.051', 'weapon4': '0.066', 'AMMO3': '0.194', 'weapon3': '0.362', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.054'} +[2023-09-14 14:37:07,378][63771] DAMAGECOUNT value on done: 10.0 +[2023-09-14 14:37:07,379][63771] Sum rewards: -5.850, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '0.002', 'AMMO5': '0.003', 'HITCOUNT': '0.010', 'AMMO2': '0.019', 'weapon5': '0.020', 'DAMAGECOUNT': '0.030', 'ARMOR': '0.041', 'WEAPON5': '0.050', 'AMMO3': '0.081', 'AMMO4': '0.096', 'WEAPON4': '0.150', 'weapon4': '0.178', 'WEAPON3': '0.450', 'weapon3': '0.496', 'weapon2': '0.774'} +[2023-09-14 14:37:07,457][63735] DAMAGECOUNT value on done: 0.0 +[2023-09-14 14:37:07,463][63769] DAMAGECOUNT value on done: 130.0 +[2023-09-14 14:37:07,464][63454] Saving new best policy, reward=-6.331! +[2023-09-14 14:37:07,464][63576] Saving new best policy, reward=-6.765! +[2023-09-14 14:37:07,546][63767] DAMAGECOUNT value on done: 0.0 +[2023-09-14 14:37:07,625][63770] DAMAGECOUNT value on done: 55.0 +[2023-09-14 14:37:07,625][63770] Sum rewards: -7.588, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.196', 'AMMO2': '0.016', 'WEAPON1': '0.020', 'weapon4': '0.026', 'ARMOR': '0.032', 'HITCOUNT': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.077', 'AMMO3': '0.146', 'DAMAGECOUNT': '0.165', 'weapon3': '0.742', 'WEAPON3': '0.800', 'weapon2': '0.984', 'FRAGCOUNT': '1.000'} +[2023-09-14 14:37:07,779][63771] DAMAGECOUNT value on done: 30.0 +[2023-09-14 14:37:07,779][63771] Sum rewards: -5.993, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.352', 'AMMO4': '-0.008', 'AMMO2': '-0.002', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'HITCOUNT': '0.030', 'ARMOR': '0.036', 'DAMAGECOUNT': '0.090', 'AMMO3': '0.115', 'WEAPON3': '0.600', 'weapon3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.032'} +[2023-09-14 14:37:07,802][63770] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 14:37:07,938][63769] DAMAGECOUNT value on done: 55.0 +[2023-09-14 14:37:08,049][63770] DAMAGECOUNT value on done: 90.0 +[2023-09-14 14:37:08,049][63770] Sum rewards: -6.528, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.858', 'weapon5': '0.006', 'AMMO5': '0.007', 'AMMO2': '0.021', 'HITCOUNT': '0.080', 'weapon4': '0.100', 'AMMO4': '0.105', 'AMMO3': '0.132', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.270', 'weapon3': '0.418', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.040'} +[2023-09-14 14:37:08,085][63769] Multiple policies in trajectory buffer: [0 1] (-1 means inactive agent) +[2023-09-14 14:37:09,533][63733] Updated weights for policy 1, policy_version 30 (0.0011) +[2023-09-14 14:37:15,361][63733] Updated weights for policy 1, policy_version 40 (0.0011) +[2023-09-14 14:37:16,143][63732] Updated weights for policy 0, policy_version 50 (0.0011) +[2023-09-14 14:37:19,253][63805] Large shaping reward -2.549 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.3, -100.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 14:37:21,156][63733] Updated weights for policy 1, policy_version 50 (0.0011) +[2023-09-14 14:37:25,759][63732] Updated weights for policy 0, policy_version 60 (0.0011) +[2023-09-14 14:37:26,940][63733] Updated weights for policy 1, policy_version 60 (0.0011) +[2023-09-14 14:37:27,670][63770] DAMAGECOUNT value on done: 20.0 +[2023-09-14 14:37:27,671][63770] Sum rewards: -11.475, reward structure: {'DEATHCOUNT': '-11.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.470', 'AMMO5': '0.003', 'weapon5': '0.006', 'HITCOUNT': '0.010', 'AMMO2': '0.011', 'DAMAGECOUNT': '0.015', 'WEAPON1': '0.020', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.053', 'AMMO3': '0.113', 'weapon4': '0.148', 'weapon3': '0.404', 'WEAPON3': '0.550', 'weapon2': '1.312'} +[2023-09-14 14:37:27,794][63806] DAMAGECOUNT value on done: 25.0 +[2023-09-14 14:37:27,795][63806] Sum rewards: -10.169, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.638', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.003', 'AMMO2': '0.015', 'weapon5': '0.016', 'weapon4': '0.034', 'ARMOR': '0.048', 'WEAPON5': '0.050', 'AMMO4': '0.075', 'WEAPON4': '0.100', 'AMMO3': '0.134', 'weapon3': '0.492', 'WEAPON3': '0.700', 'weapon2': '1.052'} +[2023-09-14 14:37:28,074][63770] DAMAGECOUNT value on done: 20.0 +[2023-09-14 14:37:28,194][63806] DAMAGECOUNT value on done: 343.0 +[2023-09-14 14:37:28,195][63806] Sum rewards: -6.892, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.150', 'AMMO5': '0.007', 'AMMO2': '0.012', 'weapon4': '0.012', 'ARMOR': '0.016', 'WEAPON1': '0.020', 'AMMO4': '0.059', 'HITCOUNT': '0.070', 'AMMO3': '0.099', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.550', 'weapon3': '0.660', 'FRAGCOUNT': '1.000', 'weapon2': '1.128'} +[2023-09-14 14:37:28,618][63805] DAMAGECOUNT value on done: 50.0 +[2023-09-14 14:37:28,665][63734] DAMAGECOUNT value on done: 295.0 +[2023-09-14 14:37:28,792][63734] DAMAGECOUNT value on done: 20.0 +[2023-09-14 14:37:29,002][63805] DAMAGECOUNT value on done: 15.0 +[2023-09-14 14:37:29,052][63734] DAMAGECOUNT value on done: 56.0 +[2023-09-14 14:37:29,111][63735] DAMAGECOUNT value on done: 80.0 +[2023-09-14 14:37:29,144][63734] DAMAGECOUNT value on done: 57.0 +[2023-09-14 14:37:29,317][63771] DAMAGECOUNT value on done: 185.0 +[2023-09-14 14:37:29,318][63771] Sum rewards: -6.046, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.970', 'AMMO5': '0.005', 'AMMO2': '0.005', 'weapon5': '0.006', 'weapon4': '0.014', 'AMMO4': '0.025', 'ARMOR': '0.055', 'HITCOUNT': '0.090', 'AMMO3': '0.095', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.500', 'weapon3': '0.582', 'FRAGCOUNT': '1.000', 'weapon2': '1.146'} +[2023-09-14 14:37:29,576][63735] DAMAGECOUNT value on done: 30.0 +[2023-09-14 14:37:29,669][63806] DAMAGECOUNT value on done: 190.0 +[2023-09-14 14:37:29,752][63735] DAMAGECOUNT value on done: 132.0 +[2023-09-14 14:37:29,752][63735] Sum rewards: -7.148, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.382', 'AMMO2': '0.003', 'AMMO4': '0.016', 'weapon4': '0.038', 'WEAPON4': '0.050', 'HITCOUNT': '0.080', 'AMMO3': '0.154', 'DAMAGECOUNT': '0.351', 'ARMOR': '0.476', 'weapon3': '0.502', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.264'} +[2023-09-14 14:37:29,763][63771] DAMAGECOUNT value on done: 5.0 +[2023-09-14 14:37:30,085][63806] DAMAGECOUNT value on done: 42.0 +[2023-09-14 14:37:30,101][63735] DAMAGECOUNT value on done: 35.0 +[2023-09-14 14:37:30,101][63767] DAMAGECOUNT value on done: 173.0 +[2023-09-14 14:37:30,101][63735] Sum rewards: -8.929, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.084', 'AMMO5': '0.007', 'HITCOUNT': '0.010', 'AMMO2': '0.017', 'WEAPON1': '0.020', 'weapon5': '0.042', 'DAMAGECOUNT': '0.060', 'AMMO4': '0.083', 'AMMO3': '0.094', 'ARMOR': '0.104', 'weapon4': '0.144', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'weapon3': '0.376', 'WEAPON3': '0.500', 'weapon2': '0.898'} +[2023-09-14 14:37:30,180][63771] DAMAGECOUNT value on done: 10.0 +[2023-09-14 14:37:30,416][63767] DAMAGECOUNT value on done: 180.0 +[2023-09-14 14:37:30,417][63767] Sum rewards: -5.813, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.600', 'weapon5': '0.002', 'AMMO2': '0.007', 'ARMOR': '0.012', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.037', 'HITCOUNT': '0.060', 'AMMO3': '0.172', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.345', 'weapon3': '0.714', 'WEAPON3': '0.900', 'weapon2': '1.052', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:37:30,634][63771] DAMAGECOUNT value on done: 190.0 +[2023-09-14 14:37:30,634][63771] Sum rewards: -10.164, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.192', 'ARMOR': '0.020', 'AMMO2': '0.022', 'WEAPON4': '0.100', 'AMMO4': '0.109', 'HITCOUNT': '0.120', 'AMMO3': '0.209', 'DAMAGECOUNT': '0.480', 'weapon3': '0.698', 'weapon2': '0.970', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050'} +[2023-09-14 14:37:30,730][63805] DAMAGECOUNT value on done: 240.0 +[2023-09-14 14:37:30,731][63805] Sum rewards: -9.086, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.516', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.010', 'weapon5': '0.020', 'AMMO2': '0.023', 'weapon4': '0.032', 'ARMOR': '0.040', 'HITCOUNT': '0.090', 'AMMO4': '0.117', 'AMMO3': '0.130', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.270', 'WEAPON3': '0.700', 'weapon3': '0.714', 'weapon2': '1.184'} +[2023-09-14 14:37:31,059][63805] DAMAGECOUNT value on done: 335.0 +[2023-09-14 14:37:31,060][63805] Sum rewards: -4.074, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.136', 'ARMOR': '0.004', 'AMMO2': '0.016', 'weapon4': '0.032', 'AMMO4': '0.078', 'HITCOUNT': '0.110', 'AMMO3': '0.139', 'WEAPON4': '0.150', 'weapon3': '0.626', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.885', 'weapon2': '1.272', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:37:31,574][63769] DAMAGECOUNT value on done: 135.0 +[2023-09-14 14:37:31,989][63769] DAMAGECOUNT value on done: 65.0 +[2023-09-14 14:37:32,122][63767] DAMAGECOUNT value on done: 70.0 +[2023-09-14 14:37:32,138][63769] DAMAGECOUNT value on done: 254.0 +[2023-09-14 14:37:32,139][63769] Sum rewards: -2.667, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO2': '0.018', 'ARMOR': '0.032', 'HITCOUNT': '0.070', 'AMMO4': '0.087', 'WEAPON4': '0.100', 'weapon4': '0.122', 'AMMO3': '0.125', 'DAMAGECOUNT': '0.243', 'HEALTH': '0.300', 'WEAPON3': '0.650', 'weapon3': '0.890', 'weapon2': '0.946', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:37:32,486][63767] DAMAGECOUNT value on done: 66.0 +[2023-09-14 14:37:32,571][63769] DAMAGECOUNT value on done: 54.0 +[2023-09-14 14:37:32,865][63770] DAMAGECOUNT value on done: 70.0 +[2023-09-14 14:37:33,086][63733] Updated weights for policy 1, policy_version 70 (0.0012) +[2023-09-14 14:37:33,254][63770] DAMAGECOUNT value on done: 140.0 +[2023-09-14 14:37:33,255][63770] Sum rewards: -7.999, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.638', 'AMMO2': '0.020', 'HITCOUNT': '0.050', 'weapon4': '0.062', 'AMMO4': '0.099', 'WEAPON4': '0.100', 'AMMO3': '0.106', 'DAMAGECOUNT': '0.150', 'weapon3': '0.404', 'WEAPON3': '0.450', 'ARMOR': '0.488', 'FRAGCOUNT': '1.000', 'weapon2': '1.210'} +[2023-09-14 14:37:34,909][63732] Updated weights for policy 0, policy_version 70 (0.0012) +[2023-09-14 14:37:39,339][63733] Updated weights for policy 1, policy_version 80 (0.0011) +[2023-09-14 14:37:44,104][63732] Updated weights for policy 0, policy_version 80 (0.0010) +[2023-09-14 14:37:45,714][63733] Updated weights for policy 1, policy_version 90 (0.0013) +[2023-09-14 14:37:51,961][63733] Updated weights for policy 1, policy_version 100 (0.0011) +[2023-09-14 14:37:52,135][63771] DAMAGECOUNT value on done: 220.0 +[2023-09-14 14:37:52,475][63734] DAMAGECOUNT value on done: 335.0 +[2023-09-14 14:37:52,499][63805] DAMAGECOUNT value on done: 60.0 +[2023-09-14 14:37:52,525][63771] DAMAGECOUNT value on done: 42.0 +[2023-09-14 14:37:52,885][63734] DAMAGECOUNT value on done: 106.0 +[2023-09-14 14:37:52,912][63805] DAMAGECOUNT value on done: 85.0 +[2023-09-14 14:37:53,247][63806] DAMAGECOUNT value on done: 106.0 +[2023-09-14 14:37:53,366][63732] Updated weights for policy 0, policy_version 90 (0.0011) +[2023-09-14 14:37:53,471][63770] DAMAGECOUNT value on done: 35.0 +[2023-09-14 14:37:53,546][63767] DAMAGECOUNT value on done: 260.0 +[2023-09-14 14:37:53,630][63806] DAMAGECOUNT value on done: 373.0 +[2023-09-14 14:37:53,714][63771] DAMAGECOUNT value on done: 18.0 +[2023-09-14 14:37:53,828][63770] DAMAGECOUNT value on done: 155.0 +[2023-09-14 14:37:53,828][63770] Sum rewards: -7.221, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.253', 'AMMO5': '0.003', 'weapon5': '0.004', 'AMMO2': '0.024', 'WEAPON5': '0.050', 'ARMOR': '0.076', 'HITCOUNT': '0.080', 'weapon4': '0.106', 'AMMO4': '0.117', 'AMMO3': '0.153', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.405', 'weapon3': '0.558', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.156'} +[2023-09-14 14:37:53,957][63767] DAMAGECOUNT value on done: 225.0 +[2023-09-14 14:37:53,957][63767] Sum rewards: -1.925, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.155', 'AMMO5': '0.007', 'AMMO2': '0.020', 'weapon5': '0.028', 'HITCOUNT': '0.050', 'WEAPON5': '0.050', 'weapon4': '0.070', 'ARMOR': '0.085', 'AMMO4': '0.097', 'AMMO3': '0.121', 'DAMAGECOUNT': '0.135', 'WEAPON4': '0.200', 'weapon3': '0.546', 'WEAPON3': '0.650', 'weapon2': '1.170', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:37:54,094][63771] DAMAGECOUNT value on done: 217.0 +[2023-09-14 14:37:54,286][63734] DAMAGECOUNT value on done: 35.0 +[2023-09-14 14:37:54,761][63735] DAMAGECOUNT value on done: 100.0 +[2023-09-14 14:37:54,773][63734] DAMAGECOUNT value on done: 162.0 +[2023-09-14 14:37:54,774][63734] Sum rewards: -6.917, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.010', 'AMMO2': '0.020', 'ARMOR': '0.024', 'WEAPON1': '0.030', 'weapon4': '0.032', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'AMMO4': '0.102', 'AMMO3': '0.124', 'DAMAGECOUNT': '0.315', 'weapon3': '0.606', 'WEAPON3': '0.650', 'weapon2': '1.240', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:37:54,820][63767] DAMAGECOUNT value on done: 155.0 +[2023-09-14 14:37:54,821][63767] Sum rewards: -5.440, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.668', 'AMMO4': '-0.018', 'AMMO2': '-0.004', 'ARMOR': '0.052', 'HITCOUNT': '0.060', 'AMMO3': '0.135', 'DAMAGECOUNT': '0.255', 'WEAPON3': '0.550', 'weapon3': '0.706', 'weapon2': '0.992', 'FRAGCOUNT': '1.000'} +[2023-09-14 14:37:55,127][63735] DAMAGECOUNT value on done: 107.0 +[2023-09-14 14:37:55,128][63735] Sum rewards: -6.089, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.822', 'AMMO2': '0.013', 'HITCOUNT': '0.060', 'AMMO4': '0.062', 'WEAPON4': '0.100', 'AMMO3': '0.107', 'weapon4': '0.124', 'DAMAGECOUNT': '0.231', 'weapon3': '0.398', 'WEAPON3': '0.450', 'FRAGCOUNT': '1.000', 'weapon2': '1.188'} +[2023-09-14 14:37:55,178][63806] DAMAGECOUNT value on done: 270.0 +[2023-09-14 14:37:55,214][63767] DAMAGECOUNT value on done: 71.0 +[2023-09-14 14:37:55,246][63735] DAMAGECOUNT value on done: 132.0 +[2023-09-14 14:37:55,535][63806] DAMAGECOUNT value on done: 56.0 +[2023-09-14 14:37:55,628][63735] DAMAGECOUNT value on done: 200.0 +[2023-09-14 14:37:55,628][63735] Sum rewards: -6.599, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.222', 'AMMO2': '0.001', 'AMMO5': '0.003', 'AMMO4': '0.006', 'WEAPON5': '0.050', 'ARMOR': '0.080', 'HITCOUNT': '0.080', 'AMMO3': '0.182', 'DAMAGECOUNT': '0.495', 'weapon3': '0.872', 'WEAPON3': '0.950', 'weapon2': '1.154', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:37:56,178][63769] DAMAGECOUNT value on done: 339.0 +[2023-09-14 14:37:56,339][63805] DAMAGECOUNT value on done: 265.0 +[2023-09-14 14:37:56,340][63805] Sum rewards: -8.041, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.003', 'AMMO2': '0.014', 'HITCOUNT': '0.020', 'weapon5': '0.032', 'WEAPON5': '0.050', 'AMMO4': '0.072', 'DAMAGECOUNT': '0.075', 'ARMOR': '0.088', 'weapon4': '0.090', 'AMMO3': '0.128', 'WEAPON4': '0.150', 'weapon3': '0.370', 'HEALTH': '0.463', 'WEAPON3': '0.600', 'weapon2': '1.054'} +[2023-09-14 14:37:56,589][63769] DAMAGECOUNT value on done: 89.0 +[2023-09-14 14:37:56,654][63805] DAMAGECOUNT value on done: 340.0 +[2023-09-14 14:37:57,376][63769] DAMAGECOUNT value on done: 269.0 +[2023-09-14 14:37:57,422][63771] Large shaping reward -2.549 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.3, -100.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 14:37:57,762][63769] DAMAGECOUNT value on done: 90.0 +[2023-09-14 14:37:58,745][63770] DAMAGECOUNT value on done: 115.0 +[2023-09-14 14:37:58,997][63733] Updated weights for policy 1, policy_version 110 (0.0012) +[2023-09-14 14:37:59,116][63770] DAMAGECOUNT value on done: 245.0 +[2023-09-14 14:37:59,116][63770] Sum rewards: -6.528, reward structure: {'DEATHCOUNT': '-10.500', 'AMMO5': '0.003', 'AMMO2': '0.015', 'weapon5': '0.024', 'HEALTH': '0.042', 'WEAPON5': '0.050', 'weapon4': '0.054', 'HITCOUNT': '0.060', 'AMMO4': '0.073', 'ARMOR': '0.076', 'WEAPON4': '0.100', 'AMMO3': '0.107', 'DAMAGECOUNT': '0.315', 'weapon3': '0.402', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon2': '1.152'} +[2023-09-14 14:38:00,800][63732] Updated weights for policy 0, policy_version 100 (0.0012) +[2023-09-14 14:38:06,215][63733] Updated weights for policy 1, policy_version 120 (0.0010) +[2023-09-14 14:38:08,040][63732] Updated weights for policy 0, policy_version 110 (0.0011) +[2023-09-14 14:38:13,497][63733] Updated weights for policy 1, policy_version 130 (0.0010) +[2023-09-14 14:38:15,314][63732] Updated weights for policy 0, policy_version 120 (0.0013) +[2023-09-14 14:38:15,812][63734] DAMAGECOUNT value on done: 425.0 +[2023-09-14 14:38:16,035][63805] DAMAGECOUNT value on done: 150.0 +[2023-09-14 14:38:16,036][63805] Sum rewards: -6.780, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.430', 'ARMOR': '0.004', 'AMMO2': '0.020', 'HITCOUNT': '0.070', 'AMMO4': '0.101', 'AMMO3': '0.134', 'WEAPON4': '0.150', 'weapon4': '0.152', 'DAMAGECOUNT': '0.270', 'weapon3': '0.672', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.126'} +[2023-09-14 14:38:16,195][63734] DAMAGECOUNT value on done: 116.0 +[2023-09-14 14:38:16,421][63805] DAMAGECOUNT value on done: 186.0 +[2023-09-14 14:38:16,865][63735] DAMAGECOUNT value on done: 125.0 +[2023-09-14 14:38:17,203][63771] DAMAGECOUNT value on done: 53.0 +[2023-09-14 14:38:17,204][63771] Sum rewards: -6.894, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.376', 'AMMO5': '0.005', 'ARMOR': '0.008', 'AMMO2': '0.009', 'HITCOUNT': '0.030', 'AMMO4': '0.044', 'weapon5': '0.054', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.105', 'AMMO3': '0.143', 'WEAPON3': '0.750', 'weapon3': '0.794', 'FRAGCOUNT': '1.000', 'weapon2': '1.090'} +[2023-09-14 14:38:17,254][63735] DAMAGECOUNT value on done: 156.0 +[2023-09-14 14:38:17,365][63735] DAMAGECOUNT value on done: 202.0 +[2023-09-14 14:38:17,541][63771] DAMAGECOUNT value on done: 217.0 +[2023-09-14 14:38:17,572][63734] DAMAGECOUNT value on done: 65.0 +[2023-09-14 14:38:17,711][63771] DAMAGECOUNT value on done: 399.0 +[2023-09-14 14:38:17,712][63771] Sum rewards: -2.728, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.346', 'weapon5': '0.002', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'AMMO4': '0.053', 'AMMO3': '0.066', 'WEAPON4': '0.100', 'HITCOUNT': '0.150', 'weapon4': '0.172', 'WEAPON3': '0.350', 'DAMAGECOUNT': '0.537', 'weapon3': '0.726', 'FRAGCOUNT': '1.000', 'weapon2': '1.096'} +[2023-09-14 14:38:17,736][63735] DAMAGECOUNT value on done: 250.0 +[2023-09-14 14:38:17,737][63735] Sum rewards: -7.699, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.351', 'AMMO2': '0.003', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO4': '0.014', 'HITCOUNT': '0.050', 'weapon5': '0.054', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.150', 'AMMO3': '0.161', 'WEAPON3': '0.750', 'weapon3': '0.788', 'weapon2': '1.064'} +[2023-09-14 14:38:17,802][63806] DAMAGECOUNT value on done: 365.0 +[2023-09-14 14:38:17,802][63806] Sum rewards: -5.291, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.145', 'AMMO2': '0.004', 'AMMO5': '0.005', 'AMMO4': '0.021', 'weapon4': '0.042', 'HITCOUNT': '0.050', 'AMMO3': '0.091', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.285', 'ARMOR': '0.445', 'WEAPON3': '0.450', 'weapon3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.060'} +[2023-09-14 14:38:17,899][63734] DAMAGECOUNT value on done: 177.0 +[2023-09-14 14:38:17,899][63734] Sum rewards: -8.221, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.176', 'AMMO5': '0.003', 'weapon4': '0.006', 'HITCOUNT': '0.010', 'weapon5': '0.010', 'AMMO2': '0.015', 'DAMAGECOUNT': '0.045', 'WEAPON5': '0.050', 'AMMO4': '0.073', 'WEAPON4': '0.100', 'AMMO3': '0.121', 'ARMOR': '0.478', 'WEAPON3': '0.650', 'weapon3': '0.814', 'weapon2': '1.080'} +[2023-09-14 14:38:18,045][63771] DAMAGECOUNT value on done: 249.0 +[2023-09-14 14:38:18,045][63771] Sum rewards: -4.517, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.964', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'AMMO2': '0.012', 'weapon5': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'AMMO4': '0.058', 'WEAPON5': '0.100', 'AMMO3': '0.106', 'weapon4': '0.122', 'HITCOUNT': '0.130', 'WEAPON4': '0.150', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.621', 'weapon3': '0.778', 'weapon2': '0.950'} +[2023-09-14 14:38:18,099][63806] DAMAGECOUNT value on done: 141.0 +[2023-09-14 14:38:18,099][63806] Sum rewards: -7.399, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.285', 'AMMO2': '0.003', 'AMMO5': '0.005', 'weapon4': '0.008', 'AMMO4': '0.014', 'weapon5': '0.020', 'HITCOUNT': '0.030', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.105', 'AMMO3': '0.136', 'ARMOR': '0.443', 'WEAPON3': '0.600', 'weapon3': '0.822', 'FRAGCOUNT': '1.000', 'weapon2': '1.050'} +[2023-09-14 14:38:18,141][63806] DAMAGECOUNT value on done: 126.0 +[2023-09-14 14:38:18,191][63767] DAMAGECOUNT value on done: 210.0 +[2023-09-14 14:38:18,513][63767] DAMAGECOUNT value on done: 103.0 +[2023-09-14 14:38:18,514][63767] Sum rewards: -11.440, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-3.000', 'HEALTH': '-1.920', 'AMMO5': '0.009', 'HITCOUNT': '0.030', 'AMMO2': '0.031', 'weapon5': '0.036', 'DAMAGECOUNT': '0.096', 'ARMOR': '0.100', 'AMMO3': '0.127', 'AMMO4': '0.153', 'weapon4': '0.188', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'weapon3': '0.280', 'WEAPON3': '0.550', 'weapon2': '1.180'} +[2023-09-14 14:38:18,538][63806] DAMAGECOUNT value on done: 408.0 +[2023-09-14 14:38:18,952][63770] DAMAGECOUNT value on done: 91.0 +[2023-09-14 14:38:19,018][63767] DAMAGECOUNT value on done: 260.0 +[2023-09-14 14:38:19,308][63770] DAMAGECOUNT value on done: 175.0 +[2023-09-14 14:38:19,345][63767] DAMAGECOUNT value on done: 254.0 +[2023-09-14 14:38:19,345][63767] Sum rewards: -5.554, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.903', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.008', 'AMMO2': '0.013', 'HITCOUNT': '0.020', 'weapon5': '0.022', 'ARMOR': '0.040', 'AMMO3': '0.049', 'AMMO4': '0.066', 'weapon4': '0.076', 'DAMAGECOUNT': '0.087', 'WEAPON5': '0.100', 'weapon3': '0.182', 'WEAPON4': '0.200', 'WEAPON3': '0.250', 'weapon2': '1.486'} +[2023-09-14 14:38:19,459][63769] DAMAGECOUNT value on done: 379.0 +[2023-09-14 14:38:19,459][63769] Sum rewards: -7.474, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.610', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.007', 'AMMO2': '0.028', 'weapon5': '0.032', 'ARMOR': '0.040', 'HITCOUNT': '0.040', 'AMMO3': '0.093', 'DAMAGECOUNT': '0.120', 'AMMO4': '0.141', 'WEAPON5': '0.150', 'weapon4': '0.174', 'WEAPON4': '0.350', 'weapon3': '0.386', 'WEAPON3': '0.500', 'weapon2': '1.074'} +[2023-09-14 14:38:19,833][63769] DAMAGECOUNT value on done: 109.0 +[2023-09-14 14:38:20,212][63733] Updated weights for policy 1, policy_version 140 (0.0010) +[2023-09-14 14:38:21,724][63805] DAMAGECOUNT value on done: 335.0 +[2023-09-14 14:38:21,725][63805] Sum rewards: -6.938, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.762', 'AMMO2': '0.009', 'WEAPON1': '0.020', 'AMMO4': '0.043', 'WEAPON4': '0.050', 'ARMOR': '0.086', 'HITCOUNT': '0.110', 'AMMO3': '0.184', 'DAMAGECOUNT': '0.210', 'weapon3': '0.832', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.030'} +[2023-09-14 14:38:22,081][63805] DAMAGECOUNT value on done: 507.0 +[2023-09-14 14:38:22,082][63805] Sum rewards: -7.504, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.364', 'AMMO5': '0.005', 'AMMO2': '0.015', 'weapon4': '0.058', 'AMMO4': '0.077', 'WEAPON5': '0.100', 'HITCOUNT': '0.140', 'WEAPON4': '0.150', 'AMMO3': '0.174', 'DAMAGECOUNT': '0.501', 'weapon3': '0.746', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.344'} +[2023-09-14 14:38:22,117][63770] DAMAGECOUNT value on done: 115.0 +[2023-09-14 14:38:22,503][63770] DAMAGECOUNT value on done: 255.0 +[2023-09-14 14:38:22,689][63769] DAMAGECOUNT value on done: 284.0 +[2023-09-14 14:38:23,040][63769] DAMAGECOUNT value on done: 120.0 +[2023-09-14 14:38:23,041][63769] Sum rewards: -7.067, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-0.500', 'HEALTH': '-0.203', 'AMMO5': '0.003', 'AMMO2': '0.017', 'HITCOUNT': '0.020', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'WEAPON5': '0.050', 'weapon5': '0.052', 'AMMO3': '0.065', 'AMMO4': '0.087', 'DAMAGECOUNT': '0.090', 'weapon4': '0.114', 'WEAPON4': '0.150', 'weapon3': '0.258', 'WEAPON3': '0.300', 'weapon2': '1.374'} +[2023-09-14 14:38:23,325][63732] Updated weights for policy 0, policy_version 130 (0.0011) +[2023-09-14 14:38:26,236][63733] Updated weights for policy 1, policy_version 150 (0.0013) +[2023-09-14 14:38:27,465][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000151_618496.pth... +[2023-09-14 14:38:27,465][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000134_548864.pth... +[2023-09-14 14:38:27,527][63576] Saving new best policy, reward=-6.755! +[2023-09-14 14:38:32,523][63732] Updated weights for policy 0, policy_version 140 (0.0010) +[2023-09-14 14:38:32,773][63733] Updated weights for policy 1, policy_version 160 (0.0012) +[2023-09-14 14:38:39,026][63733] Updated weights for policy 1, policy_version 170 (0.0010) +[2023-09-14 14:38:39,836][63734] DAMAGECOUNT value on done: 560.0 +[2023-09-14 14:38:39,837][63734] Sum rewards: -5.073, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.735', 'AMMO5': '0.005', 'AMMO2': '0.014', 'AMMO4': '0.071', 'weapon4': '0.096', 'HITCOUNT': '0.120', 'AMMO3': '0.129', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.750', 'weapon3': '0.872', 'weapon2': '1.300', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:38:39,985][63735] DAMAGECOUNT value on done: 140.0 +[2023-09-14 14:38:40,127][63805] DAMAGECOUNT value on done: 250.0 +[2023-09-14 14:38:40,190][63734] DAMAGECOUNT value on done: 156.0 +[2023-09-14 14:38:40,266][63735] DAMAGECOUNT value on done: 170.0 +[2023-09-14 14:38:40,497][63805] DAMAGECOUNT value on done: 211.0 +[2023-09-14 14:38:40,787][63767] DAMAGECOUNT value on done: 278.0 +[2023-09-14 14:38:41,136][63767] DAMAGECOUNT value on done: 337.0 +[2023-09-14 14:38:41,136][63767] Sum rewards: -5.157, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.267', 'weapon4': '0.008', 'AMMO2': '0.010', 'AMMO4': '0.052', 'AMMO3': '0.076', 'ARMOR': '0.076', 'WEAPON4': '0.100', 'HITCOUNT': '0.180', 'WEAPON3': '0.400', 'weapon3': '0.680', 'DAMAGECOUNT': '0.702', 'weapon2': '1.326', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:38:41,408][63771] DAMAGECOUNT value on done: 183.0 +[2023-09-14 14:38:41,408][63771] Sum rewards: -5.230, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.572', 'AMMO2': '0.015', 'weapon7': '0.060', 'AMMO4': '0.077', 'HITCOUNT': '0.090', 'AMMO3': '0.144', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'weapon4': '0.256', 'DAMAGECOUNT': '0.390', 'weapon3': '0.706', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.084'} +[2023-09-14 14:38:41,529][63732] Updated weights for policy 0, policy_version 150 (0.0011) +[2023-09-14 14:38:41,745][63771] DAMAGECOUNT value on done: 222.0 +[2023-09-14 14:38:42,349][63735] DAMAGECOUNT value on done: 327.0 +[2023-09-14 14:38:42,350][63735] Sum rewards: -3.193, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.058', 'AMMO2': '0.021', 'ARMOR': '0.055', 'HITCOUNT': '0.080', 'AMMO3': '0.095', 'AMMO4': '0.107', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.550', 'weapon3': '0.994', 'FRAGCOUNT': '1.000', 'weapon2': '1.138'} +[2023-09-14 14:38:42,397][63767] DAMAGECOUNT value on done: 295.0 +[2023-09-14 14:38:42,397][63767] Sum rewards: -8.105, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.283', 'AMMO5': '0.005', 'AMMO2': '0.013', 'HITCOUNT': '0.030', 'ARMOR': '0.036', 'weapon4': '0.042', 'AMMO4': '0.063', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.105', 'WEAPON4': '0.150', 'AMMO3': '0.160', 'WEAPON3': '0.900', 'weapon3': '0.976', 'FRAGCOUNT': '1.000', 'weapon2': '1.098'} +[2023-09-14 14:38:42,461][63576] Saving new best policy, reward=-6.679! +[2023-09-14 14:38:42,741][63806] DAMAGECOUNT value on done: 365.0 +[2023-09-14 14:38:42,748][63735] DAMAGECOUNT value on done: 268.0 +[2023-09-14 14:38:42,759][63767] DAMAGECOUNT value on done: 263.0 +[2023-09-14 14:38:42,927][63734] DAMAGECOUNT value on done: 135.0 +[2023-09-14 14:38:43,030][63806] DAMAGECOUNT value on done: 241.0 +[2023-09-14 14:38:43,031][63806] Sum rewards: -8.499, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.934', 'AMMO5': '0.005', 'weapon5': '0.010', 'AMMO2': '0.016', 'HITCOUNT': '0.060', 'ARMOR': '0.068', 'AMMO4': '0.078', 'WEAPON5': '0.100', 'weapon4': '0.170', 'AMMO3': '0.175', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.300', 'weapon3': '0.576', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.028'} +[2023-09-14 14:38:43,076][63806] DAMAGECOUNT value on done: 136.0 +[2023-09-14 14:38:43,287][63769] DAMAGECOUNT value on done: 429.0 +[2023-09-14 14:38:43,368][63734] DAMAGECOUNT value on done: 177.0 +[2023-09-14 14:38:43,398][63771] DAMAGECOUNT value on done: 418.0 +[2023-09-14 14:38:43,399][63771] Sum rewards: -8.294, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.411', 'AMMO2': '0.008', 'weapon4': '0.012', 'HITCOUNT': '0.030', 'ARMOR': '0.040', 'AMMO4': '0.041', 'DAMAGECOUNT': '0.057', 'WEAPON4': '0.100', 'AMMO3': '0.121', 'WEAPON3': '0.650', 'weapon3': '0.692', 'FRAGCOUNT': '1.000', 'weapon2': '1.116'} +[2023-09-14 14:38:43,483][63806] DAMAGECOUNT value on done: 428.0 +[2023-09-14 14:38:43,620][63769] DAMAGECOUNT value on done: 174.0 +[2023-09-14 14:38:43,741][63771] DAMAGECOUNT value on done: 313.0 +[2023-09-14 14:38:43,741][63771] Sum rewards: -7.338, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.518', 'AMMO2': '0.008', 'AMMO4': '0.037', 'HITCOUNT': '0.060', 'ARMOR': '0.064', 'WEAPON4': '0.100', 'weapon4': '0.166', 'AMMO3': '0.185', 'DAMAGECOUNT': '0.192', 'weapon3': '0.712', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.206'} +[2023-09-14 14:38:44,404][63770] DAMAGECOUNT value on done: 91.0 +[2023-09-14 14:38:44,812][63770] DAMAGECOUNT value on done: 226.0 +[2023-09-14 14:38:44,813][63770] Sum rewards: -7.279, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.290', 'AMMO2': '0.009', 'ARMOR': '0.020', 'AMMO4': '0.045', 'weapon4': '0.048', 'HITCOUNT': '0.070', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.153', 'AMMO3': '0.174', 'weapon3': '0.708', 'WEAPON3': '0.950', 'weapon2': '1.234', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:38:45,134][63733] Updated weights for policy 1, policy_version 180 (0.0011) +[2023-09-14 14:38:45,268][63770] DAMAGECOUNT value on done: 205.0 +[2023-09-14 14:38:45,268][63770] Sum rewards: -5.193, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.750', 'AMMO2': '0.015', 'HITCOUNT': '0.060', 'ARMOR': '0.064', 'AMMO4': '0.074', 'AMMO3': '0.110', 'weapon4': '0.146', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.270', 'weapon3': '0.452', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.066'} +[2023-09-14 14:38:45,603][63770] DAMAGECOUNT value on done: 315.0 +[2023-09-14 14:38:45,603][63770] Sum rewards: -6.227, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.982', 'AMMO2': '0.002', 'AMMO5': '0.009', 'AMMO4': '0.011', 'weapon5': '0.016', 'WEAPON4': '0.050', 'ARMOR': '0.056', 'HITCOUNT': '0.060', 'weapon4': '0.092', 'WEAPON5': '0.100', 'AMMO3': '0.110', 'DAMAGECOUNT': '0.180', 'WEAPON3': '0.550', 'weapon3': '0.796', 'weapon2': '0.972'} +[2023-09-14 14:38:46,294][63769] DAMAGECOUNT value on done: 389.0 +[2023-09-14 14:38:46,294][63769] Sum rewards: -8.171, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.620', 'weapon5': '0.008', 'AMMO2': '0.011', 'AMMO5': '0.015', 'AMMO4': '0.054', 'weapon4': '0.056', 'HITCOUNT': '0.090', 'WEAPON4': '0.150', 'AMMO3': '0.160', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.900', 'weapon3': '0.914', 'FRAGCOUNT': '1.000', 'weapon2': '1.076'} +[2023-09-14 14:38:46,638][63769] DAMAGECOUNT value on done: 145.0 +[2023-09-14 14:38:47,173][63805] DAMAGECOUNT value on done: 380.0 +[2023-09-14 14:38:47,174][63805] Sum rewards: -6.813, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.328', 'AMMO5': '0.013', 'AMMO2': '0.017', 'weapon5': '0.026', 'HITCOUNT': '0.050', 'AMMO4': '0.086', 'AMMO3': '0.087', 'DAMAGECOUNT': '0.135', 'WEAPON4': '0.150', 'weapon4': '0.162', 'WEAPON5': '0.200', 'weapon3': '0.372', 'WEAPON3': '0.450', 'ARMOR': '0.525', 'FRAGCOUNT': '1.000', 'weapon2': '1.492'} +[2023-09-14 14:38:47,608][63805] DAMAGECOUNT value on done: 507.0 +[2023-09-14 14:38:50,283][63732] Updated weights for policy 0, policy_version 160 (0.0010) +[2023-09-14 14:38:51,268][63733] Updated weights for policy 1, policy_version 190 (0.0010) +[2023-09-14 14:38:57,304][63733] Updated weights for policy 1, policy_version 200 (0.0010) +[2023-09-14 14:38:59,126][63732] Updated weights for policy 0, policy_version 170 (0.0010) +[2023-09-14 14:39:01,953][63735] DAMAGECOUNT value on done: 305.0 +[2023-09-14 14:39:01,954][63735] Sum rewards: -8.183, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.139', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.003', 'AMMO2': '0.019', 'ARMOR': '0.034', 'weapon5': '0.042', 'WEAPON5': '0.050', 'weapon4': '0.086', 'AMMO4': '0.093', 'HITCOUNT': '0.140', 'AMMO3': '0.150', 'WEAPON4': '0.150', 'weapon3': '0.446', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.650', 'weapon2': '1.598'} +[2023-09-14 14:39:02,306][63735] DAMAGECOUNT value on done: 225.0 +[2023-09-14 14:39:02,896][63767] DAMAGECOUNT value on done: 293.0 +[2023-09-14 14:39:03,214][63767] DAMAGECOUNT value on done: 389.0 +[2023-09-14 14:39:03,306][63734] DAMAGECOUNT value on done: 630.0 +[2023-09-14 14:39:03,399][63733] Updated weights for policy 1, policy_version 210 (0.0010) +[2023-09-14 14:39:03,407][63805] DAMAGECOUNT value on done: 262.0 +[2023-09-14 14:39:03,678][63734] DAMAGECOUNT value on done: 170.0 +[2023-09-14 14:39:03,726][63805] DAMAGECOUNT value on done: 271.0 +[2023-09-14 14:39:04,939][63771] DAMAGECOUNT value on done: 188.0 +[2023-09-14 14:39:05,275][63767] DAMAGECOUNT value on done: 371.0 +[2023-09-14 14:39:05,276][63767] Sum rewards: -6.189, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.010', 'FRAGCOUNT': '-0.500', 'ARMOR': '0.004', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO2': '0.023', 'weapon5': '0.032', 'HITCOUNT': '0.080', 'AMMO3': '0.093', 'AMMO4': '0.113', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.228', 'WEAPON4': '0.250', 'weapon4': '0.368', 'WEAPON3': '0.500', 'weapon3': '0.654', 'weapon2': '1.054'} +[2023-09-14 14:39:05,323][63771] DAMAGECOUNT value on done: 322.0 +[2023-09-14 14:39:05,323][63771] Sum rewards: -8.277, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.605', 'FRAGCOUNT': '-1.500', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'AMMO5': '0.003', 'ARMOR': '0.008', 'weapon5': '0.030', 'WEAPON5': '0.050', 'HITCOUNT': '0.080', 'AMMO3': '0.144', 'DAMAGECOUNT': '0.300', 'weapon3': '0.678', 'WEAPON3': '0.700', 'weapon2': '1.094'} +[2023-09-14 14:39:05,618][63767] DAMAGECOUNT value on done: 348.0 +[2023-09-14 14:39:05,619][63767] Sum rewards: -4.488, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.822', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO4': '0.025', 'AMMO3': '0.050', 'WEAPON5': '0.050', 'ARMOR': '0.072', 'HITCOUNT': '0.080', 'WEAPON3': '0.250', 'DAMAGECOUNT': '0.255', 'weapon3': '0.636', 'FRAGCOUNT': '1.000', 'weapon2': '1.408'} +[2023-09-14 14:39:06,464][63769] DAMAGECOUNT value on done: 494.0 +[2023-09-14 14:39:06,464][63769] Sum rewards: -2.672, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.505', 'AMMO2': '0.005', 'weapon4': '0.006', 'AMMO4': '0.025', 'ARMOR': '0.040', 'HITCOUNT': '0.050', 'WEAPON4': '0.050', 'AMMO3': '0.099', 'DAMAGECOUNT': '0.195', 'weapon3': '0.408', 'WEAPON3': '0.450', 'FRAGCOUNT': '1.000', 'weapon2': '1.504'} +[2023-09-14 14:39:06,694][63735] DAMAGECOUNT value on done: 337.0 +[2023-09-14 14:39:06,785][63769] DAMAGECOUNT value on done: 209.0 +[2023-09-14 14:39:07,092][63735] DAMAGECOUNT value on done: 323.0 +[2023-09-14 14:39:07,223][63806] DAMAGECOUNT value on done: 430.0 +[2023-09-14 14:39:07,517][63806] DAMAGECOUNT value on done: 397.0 +[2023-09-14 14:39:07,517][63806] Sum rewards: -2.603, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.084', 'weapon4': '0.004', 'AMMO2': '0.017', 'HITCOUNT': '0.050', 'ARMOR': '0.056', 'AMMO4': '0.085', 'weapon7': '0.086', 'AMMO3': '0.113', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.150', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.468', 'WEAPON3': '0.600', 'weapon2': '0.910', 'FRAGCOUNT': '1.000', 'weapon3': '1.002'} +[2023-09-14 14:39:07,563][63806] DAMAGECOUNT value on done: 251.0 +[2023-09-14 14:39:07,564][63806] Sum rewards: -6.511, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.510', 'AMMO2': '0.003', 'AMMO5': '0.005', 'AMMO4': '0.013', 'HITCOUNT': '0.070', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.106', 'AMMO3': '0.129', 'DAMAGECOUNT': '0.345', 'ARMOR': '0.498', 'WEAPON3': '0.650', 'weapon3': '0.902', 'FRAGCOUNT': '1.000', 'weapon2': '1.078'} +[2023-09-14 14:39:07,733][63770] DAMAGECOUNT value on done: 205.0 +[2023-09-14 14:39:07,916][63732] Updated weights for policy 0, policy_version 180 (0.0012) +[2023-09-14 14:39:07,947][63734] DAMAGECOUNT value on done: 270.0 +[2023-09-14 14:39:07,957][63806] DAMAGECOUNT value on done: 563.0 +[2023-09-14 14:39:07,958][63806] Sum rewards: -4.806, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.602', 'weapon5': '0.006', 'AMMO5': '0.013', 'AMMO2': '0.023', 'HITCOUNT': '0.090', 'AMMO4': '0.116', 'AMMO3': '0.161', 'weapon4': '0.206', 'WEAPON5': '0.250', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.405', 'ARMOR': '0.436', 'WEAPON3': '0.800', 'weapon3': '0.800', 'weapon2': '0.940', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:39:08,129][63770] DAMAGECOUNT value on done: 320.0 +[2023-09-14 14:39:08,129][63770] Sum rewards: -5.319, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.232', 'HITCOUNT': '0.010', 'DAMAGECOUNT': '0.015', 'AMMO2': '0.019', 'ARMOR': '0.044', 'AMMO4': '0.095', 'AMMO3': '0.131', 'weapon4': '0.172', 'WEAPON4': '0.250', 'WEAPON3': '0.600', 'weapon3': '0.624', 'FRAGCOUNT': '1.000', 'weapon2': '1.202'} +[2023-09-14 14:39:08,348][63734] DAMAGECOUNT value on done: 227.0 +[2023-09-14 14:39:08,348][63734] Sum rewards: -3.605, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.098', 'AMMO5': '0.003', 'weapon5': '0.014', 'AMMO2': '0.019', 'HITCOUNT': '0.050', 'WEAPON5': '0.050', 'ARMOR': '0.072', 'AMMO3': '0.081', 'AMMO4': '0.096', 'DAMAGECOUNT': '0.150', 'WEAPON4': '0.200', 'weapon4': '0.268', 'WEAPON3': '0.400', 'weapon3': '0.736', 'weapon2': '0.854', 'FRAGCOUNT': '1.000'} +[2023-09-14 14:39:08,441][63771] DAMAGECOUNT value on done: 443.0 +[2023-09-14 14:39:08,820][63771] DAMAGECOUNT value on done: 328.0 +[2023-09-14 14:39:09,302][63770] DAMAGECOUNT value on done: 121.0 +[2023-09-14 14:39:09,472][63769] DAMAGECOUNT value on done: 434.0 +[2023-09-14 14:39:09,564][63733] Updated weights for policy 1, policy_version 220 (0.0011) +[2023-09-14 14:39:09,698][63770] DAMAGECOUNT value on done: 333.0 +[2023-09-14 14:39:09,893][63769] DAMAGECOUNT value on done: 170.0 +[2023-09-14 14:39:11,945][63805] DAMAGECOUNT value on done: 380.0 +[2023-09-14 14:39:12,346][63805] DAMAGECOUNT value on done: 552.0 +[2023-09-14 14:39:12,461][63576] Saving new best policy, reward=-6.626! +[2023-09-14 14:39:15,734][63733] Updated weights for policy 1, policy_version 230 (0.0011) +[2023-09-14 14:39:16,870][63732] Updated weights for policy 0, policy_version 190 (0.0010) +[2023-09-14 14:39:21,814][63733] Updated weights for policy 1, policy_version 240 (0.0011) +[2023-09-14 14:39:23,971][63735] DAMAGECOUNT value on done: 380.0 +[2023-09-14 14:39:24,319][63735] DAMAGECOUNT value on done: 272.0 +[2023-09-14 14:39:25,167][63771] Large shaping reward -2.534 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.28500000000000003, -95.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 14:39:25,180][63767] DAMAGECOUNT value on done: 352.0 +[2023-09-14 14:39:25,181][63767] Sum rewards: -2.168, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.642', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'HITCOUNT': '0.060', 'AMMO3': '0.120', 'DAMAGECOUNT': '0.177', 'ARMOR': '0.420', 'WEAPON3': '0.600', 'weapon3': '0.902', 'FRAGCOUNT': '1.000', 'weapon2': '1.196'} +[2023-09-14 14:39:25,509][63767] DAMAGECOUNT value on done: 532.0 +[2023-09-14 14:39:25,510][63767] Sum rewards: -9.286, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.160', 'AMMO2': '0.016', 'ARMOR': '0.021', 'HITCOUNT': '0.070', 'AMMO4': '0.079', 'weapon4': '0.112', 'AMMO3': '0.131', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.429', 'weapon3': '0.624', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.292'} +[2023-09-14 14:39:25,679][63732] Updated weights for policy 0, policy_version 200 (0.0011) +[2023-09-14 14:39:26,858][63805] DAMAGECOUNT value on done: 415.0 +[2023-09-14 14:39:27,049][63734] DAMAGECOUNT value on done: 653.0 +[2023-09-14 14:39:27,198][63805] DAMAGECOUNT value on done: 306.0 +[2023-09-14 14:39:27,199][63805] Sum rewards: -4.060, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.580', 'WEAPON1': '0.010', 'AMMO2': '0.012', 'weapon5': '0.020', 'AMMO5': '0.022', 'weapon4': '0.026', 'HITCOUNT': '0.030', 'WEAPON4': '0.050', 'AMMO3': '0.059', 'AMMO4': '0.061', 'DAMAGECOUNT': '0.105', 'WEAPON3': '0.300', 'WEAPON5': '0.350', 'weapon3': '0.360', 'FRAGCOUNT': '1.000', 'weapon2': '1.614'} +[2023-09-14 14:39:27,465][63576] Saving new best policy, reward=-6.617! +[2023-09-14 14:39:27,477][63734] DAMAGECOUNT value on done: 200.0 +[2023-09-14 14:39:27,932][63733] Updated weights for policy 1, policy_version 250 (0.0012) +[2023-09-14 14:39:28,279][63767] DAMAGECOUNT value on done: 411.0 +[2023-09-14 14:39:28,280][63767] Sum rewards: -5.215, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.984', 'AMMO2': '0.005', 'AMMO5': '0.009', 'weapon5': '0.016', 'WEAPON1': '0.020', 'AMMO4': '0.024', 'HITCOUNT': '0.040', 'weapon4': '0.086', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.120', 'AMMO3': '0.158', 'WEAPON5': '0.200', 'ARMOR': '0.470', 'WEAPON3': '0.850', 'weapon3': '0.870', 'FRAGCOUNT': '1.000', 'weapon2': '1.050'} +[2023-09-14 14:39:28,619][63771] DAMAGECOUNT value on done: 253.0 +[2023-09-14 14:39:28,678][63767] DAMAGECOUNT value on done: 483.0 +[2023-09-14 14:39:28,679][63767] Sum rewards: -6.509, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.827', 'AMMO2': '0.016', 'AMMO4': '0.078', 'HITCOUNT': '0.080', 'AMMO3': '0.130', 'WEAPON4': '0.150', 'weapon4': '0.390', 'DAMAGECOUNT': '0.405', 'ARMOR': '0.469', 'weapon3': '0.546', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.154'} +[2023-09-14 14:39:28,971][63771] DAMAGECOUNT value on done: 432.0 +[2023-09-14 14:39:28,971][63771] Sum rewards: -12.244, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-2.820', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.009', 'AMMO2': '0.011', 'weapon5': '0.012', 'weapon4': '0.022', 'AMMO4': '0.056', 'HITCOUNT': '0.070', 'WEAPON4': '0.100', 'AMMO3': '0.139', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.330', 'weapon3': '0.472', 'WEAPON3': '0.750', 'ARMOR': '0.910', 'weapon2': '1.494'} +[2023-09-14 14:39:29,854][63769] DAMAGECOUNT value on done: 494.0 +[2023-09-14 14:39:30,179][63769] DAMAGECOUNT value on done: 290.0 +[2023-09-14 14:39:30,179][63769] Sum rewards: -6.576, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.086', 'weapon5': '0.002', 'AMMO5': '0.005', 'AMMO2': '0.013', 'AMMO4': '0.064', 'AMMO3': '0.065', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.110', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.243', 'WEAPON3': '0.350', 'weapon3': '0.604', 'FRAGCOUNT': '1.000', 'weapon2': '1.404'} +[2023-09-14 14:39:30,487][63770] DAMAGECOUNT value on done: 205.0 +[2023-09-14 14:39:30,488][63770] Sum rewards: -6.232, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.070', 'AMMO5': '0.009', 'AMMO2': '0.016', 'weapon5': '0.028', 'AMMO4': '0.079', 'weapon4': '0.088', 'WEAPON5': '0.100', 'AMMO3': '0.127', 'WEAPON4': '0.200', 'WEAPON3': '0.700', 'weapon3': '0.742', 'weapon2': '0.998'} +[2023-09-14 14:39:30,847][63770] DAMAGECOUNT value on done: 325.0 +[2023-09-14 14:39:31,136][63735] DAMAGECOUNT value on done: 410.0 +[2023-09-14 14:39:31,483][63735] DAMAGECOUNT value on done: 367.0 +[2023-09-14 14:39:31,483][63735] Sum rewards: -7.312, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.316', 'AMMO2': '0.001', 'AMMO5': '0.003', 'AMMO4': '0.007', 'weapon5': '0.010', 'HITCOUNT': '0.050', 'WEAPON5': '0.050', 'ARMOR': '0.056', 'weapon4': '0.094', 'WEAPON4': '0.100', 'AMMO3': '0.103', 'DAMAGECOUNT': '0.132', 'WEAPON3': '0.350', 'weapon3': '0.410', 'weapon2': '1.638'} +[2023-09-14 14:39:31,698][63806] DAMAGECOUNT value on done: 676.0 +[2023-09-14 14:39:32,036][63806] DAMAGECOUNT value on done: 416.0 +[2023-09-14 14:39:32,079][63806] DAMAGECOUNT value on done: 266.0 +[2023-09-14 14:39:32,434][63806] DAMAGECOUNT value on done: 563.0 +[2023-09-14 14:39:32,461][63576] Saving new best policy, reward=-6.367! +[2023-09-14 14:39:32,946][63769] DAMAGECOUNT value on done: 434.0 +[2023-09-14 14:39:33,242][63734] DAMAGECOUNT value on done: 311.0 +[2023-09-14 14:39:33,242][63734] Sum rewards: -1.769, reward structure: {'DEATHCOUNT': '-6.000', 'weapon7': '0.008', 'AMMO2': '0.025', 'weapon4': '0.042', 'HEALTH': '0.044', 'HITCOUNT': '0.050', 'AMMO3': '0.056', 'ARMOR': '0.056', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'DAMAGECOUNT': '0.123', 'AMMO4': '0.126', 'WEAPON4': '0.200', 'WEAPON3': '0.250', 'weapon3': '0.856', 'FRAGCOUNT': '1.000', 'weapon2': '1.094'} +[2023-09-14 14:39:33,267][63769] DAMAGECOUNT value on done: 227.0 +[2023-09-14 14:39:33,268][63769] Sum rewards: -9.022, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.984', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'weapon5': '0.016', 'AMMO2': '0.039', 'HITCOUNT': '0.050', 'WEAPON5': '0.150', 'AMMO3': '0.159', 'DAMAGECOUNT': '0.171', 'weapon4': '0.190', 'AMMO4': '0.194', 'WEAPON4': '0.400', 'WEAPON3': '0.850', 'weapon3': '0.910', 'weapon2': '1.066'} +[2023-09-14 14:39:33,409][63771] DAMAGECOUNT value on done: 472.0 +[2023-09-14 14:39:33,667][63734] DAMAGECOUNT value on done: 227.0 +[2023-09-14 14:39:33,842][63771] DAMAGECOUNT value on done: 347.0 +[2023-09-14 14:39:33,842][63771] Sum rewards: -2.550, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.374', 'HITCOUNT': '0.020', 'AMMO2': '0.040', 'DAMAGECOUNT': '0.057', 'AMMO3': '0.093', 'ARMOR': '0.136', 'AMMO4': '0.201', 'WEAPON3': '0.500', 'WEAPON4': '0.550', 'weapon3': '0.568', 'weapon4': '0.638', 'FRAGCOUNT': '1.000', 'weapon2': '1.020'} +[2023-09-14 14:39:34,049][63733] Updated weights for policy 1, policy_version 260 (0.0012) +[2023-09-14 14:39:34,196][63770] DAMAGECOUNT value on done: 231.0 +[2023-09-14 14:39:34,196][63770] Sum rewards: -2.723, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.720', 'AMMO2': '0.003', 'AMMO5': '0.010', 'AMMO4': '0.015', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'weapon5': '0.054', 'HITCOUNT': '0.060', 'AMMO3': '0.105', 'weapon4': '0.106', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.450', 'weapon3': '0.730', 'weapon2': '0.914', 'FRAGCOUNT': '1.000'} +[2023-09-14 14:39:34,556][63732] Updated weights for policy 0, policy_version 210 (0.0010) +[2023-09-14 14:39:34,608][63770] DAMAGECOUNT value on done: 474.0 +[2023-09-14 14:39:34,609][63770] Sum rewards: -7.619, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.182', 'AMMO2': '0.021', 'ARMOR': '0.032', 'AMMO4': '0.103', 'HITCOUNT': '0.130', 'AMMO3': '0.152', 'WEAPON4': '0.200', 'weapon4': '0.312', 'DAMAGECOUNT': '0.423', 'weapon3': '0.682', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.008'} +[2023-09-14 14:39:36,710][63805] DAMAGECOUNT value on done: 435.0 +[2023-09-14 14:39:37,109][63805] DAMAGECOUNT value on done: 596.0 +[2023-09-14 14:39:37,466][63576] Saving new best policy, reward=-6.275! +[2023-09-14 14:39:40,288][63733] Updated weights for policy 1, policy_version 270 (0.0012) +[2023-09-14 14:39:43,408][63732] Updated weights for policy 0, policy_version 220 (0.0010) +[2023-09-14 14:39:46,457][63733] Updated weights for policy 1, policy_version 280 (0.0010) +[2023-09-14 14:39:46,470][63735] DAMAGECOUNT value on done: 399.0 +[2023-09-14 14:39:46,797][63735] DAMAGECOUNT value on done: 287.0 +[2023-09-14 14:39:47,583][63767] DAMAGECOUNT value on done: 437.0 +[2023-09-14 14:39:47,584][63767] Sum rewards: -8.293, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.980', 'FRAGCOUNT': '-1.500', 'AMMO2': '0.013', 'AMMO5': '0.019', 'weapon5': '0.052', 'AMMO4': '0.064', 'HITCOUNT': '0.090', 'ARMOR': '0.095', 'AMMO3': '0.139', 'WEAPON4': '0.200', 'weapon4': '0.204', 'DAMAGECOUNT': '0.255', 'WEAPON5': '0.300', 'weapon2': '0.694', 'WEAPON3': '0.700', 'weapon3': '0.862'} +[2023-09-14 14:39:47,956][63767] DAMAGECOUNT value on done: 532.0 +[2023-09-14 14:39:50,318][63805] DAMAGECOUNT value on done: 430.0 +[2023-09-14 14:39:50,318][63805] Sum rewards: -9.257, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.062', 'FRAGCOUNT': '-1.500', 'weapon5': '0.010', 'AMMO5': '0.012', 'HITCOUNT': '0.020', 'AMMO2': '0.036', 'DAMAGECOUNT': '0.045', 'ARMOR': '0.064', 'AMMO3': '0.160', 'AMMO4': '0.178', 'WEAPON5': '0.250', 'WEAPON4': '0.450', 'weapon4': '0.458', 'weapon3': '0.670', 'WEAPON3': '0.800', 'weapon2': '0.902'} +[2023-09-14 14:39:50,645][63805] DAMAGECOUNT value on done: 306.0 +[2023-09-14 14:39:51,078][63734] DAMAGECOUNT value on done: 678.0 +[2023-09-14 14:39:51,480][63734] DAMAGECOUNT value on done: 370.0 +[2023-09-14 14:39:51,481][63734] Sum rewards: -2.105, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO2': '0.019', 'AMMO4': '0.093', 'AMMO3': '0.098', 'HEALTH': '0.107', 'HITCOUNT': '0.130', 'WEAPON4': '0.150', 'weapon4': '0.214', 'ARMOR': '0.436', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.510', 'weapon3': '0.848', 'FRAGCOUNT': '1.000', 'weapon2': '1.290'} +[2023-09-14 14:39:51,674][63767] DAMAGECOUNT value on done: 611.0 +[2023-09-14 14:39:51,674][63767] Sum rewards: -6.341, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.832', 'AMMO2': '0.008', 'weapon4': '0.018', 'ARMOR': '0.024', 'AMMO4': '0.038', 'WEAPON4': '0.100', 'AMMO3': '0.151', 'HITCOUNT': '0.190', 'DAMAGECOUNT': '0.600', 'WEAPON3': '0.850', 'weapon2': '1.150', 'weapon3': '1.362', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:39:52,083][63767] DAMAGECOUNT value on done: 543.0 +[2023-09-14 14:39:52,084][63767] Sum rewards: -8.489, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.994', 'AMMO5': '0.003', 'weapon5': '0.010', 'AMMO2': '0.012', 'ARMOR': '0.016', 'weapon4': '0.020', 'WEAPON5': '0.050', 'AMMO4': '0.059', 'HITCOUNT': '0.080', 'WEAPON4': '0.100', 'AMMO3': '0.161', 'DAMAGECOUNT': '0.180', 'weapon3': '0.642', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.572'} +[2023-09-14 14:39:52,290][63771] DAMAGECOUNT value on done: 278.0 +[2023-09-14 14:39:52,308][63732] Updated weights for policy 0, policy_version 230 (0.0012) +[2023-09-14 14:39:52,462][63576] Saving new best policy, reward=-6.260! +[2023-09-14 14:39:52,648][63733] Updated weights for policy 1, policy_version 290 (0.0012) +[2023-09-14 14:39:52,684][63771] DAMAGECOUNT value on done: 687.0 +[2023-09-14 14:39:52,685][63771] Sum rewards: -6.425, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.572', 'AMMO5': '0.007', 'AMMO2': '0.017', 'ARMOR': '0.028', 'AMMO4': '0.086', 'AMMO3': '0.145', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'weapon4': '0.188', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.765', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.000', 'weapon3': '1.110'} +[2023-09-14 14:39:53,248][63770] DAMAGECOUNT value on done: 255.0 +[2023-09-14 14:39:53,322][63769] DAMAGECOUNT value on done: 514.0 +[2023-09-14 14:39:53,591][63770] DAMAGECOUNT value on done: 360.0 +[2023-09-14 14:39:53,592][63770] Sum rewards: -10.518, reward structure: {'DEATHCOUNT': '-12.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.450', 'AMMO5': '0.009', 'AMMO2': '0.010', 'weapon5': '0.028', 'HITCOUNT': '0.030', 'weapon4': '0.034', 'AMMO4': '0.048', 'WEAPON4': '0.050', 'ARMOR': '0.056', 'DAMAGECOUNT': '0.105', 'WEAPON5': '0.150', 'AMMO3': '0.179', 'weapon3': '0.852', 'WEAPON3': '0.900', 'weapon2': '0.980'} +[2023-09-14 14:39:53,638][63769] DAMAGECOUNT value on done: 374.0 +[2023-09-14 14:39:53,638][63769] Sum rewards: -5.648, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.260', 'AMMO5': '0.005', 'AMMO2': '0.019', 'weapon5': '0.030', 'HITCOUNT': '0.070', 'AMMO4': '0.092', 'WEAPON5': '0.100', 'AMMO3': '0.114', 'WEAPON4': '0.150', 'weapon4': '0.176', 'DAMAGECOUNT': '0.252', 'WEAPON3': '0.600', 'weapon3': '0.604', 'FRAGCOUNT': '1.000', 'weapon2': '1.150'} +[2023-09-14 14:39:55,748][63735] DAMAGECOUNT value on done: 522.0 +[2023-09-14 14:39:55,748][63735] Sum rewards: -7.142, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.968', 'AMMO2': '0.007', 'AMMO5': '0.009', 'AMMO4': '0.034', 'HITCOUNT': '0.090', 'weapon5': '0.100', 'AMMO3': '0.124', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'weapon4': '0.232', 'DAMAGECOUNT': '0.336', 'WEAPON3': '0.450', 'weapon3': '0.484', 'FRAGCOUNT': '1.000', 'weapon2': '1.360'} +[2023-09-14 14:39:56,088][63806] DAMAGECOUNT value on done: 781.0 +[2023-09-14 14:39:56,088][63806] Sum rewards: 0.056, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-0.443', 'AMMO4': '-0.021', 'AMMO2': '-0.004', 'ARMOR': '0.036', 'HITCOUNT': '0.060', 'AMMO3': '0.065', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.315', 'weapon3': '0.800', 'weapon2': '0.948', 'FRAGCOUNT': '1.000'} +[2023-09-14 14:39:56,143][63735] DAMAGECOUNT value on done: 487.0 +[2023-09-14 14:39:56,143][63735] Sum rewards: -4.359, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.023', 'AMMO5': '0.004', 'AMMO2': '0.017', 'HITCOUNT': '0.060', 'AMMO4': '0.082', 'weapon5': '0.086', 'AMMO3': '0.099', 'WEAPON5': '0.100', 'ARMOR': '0.112', 'weapon4': '0.188', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.360', 'WEAPON3': '0.450', 'weapon3': '0.548', 'FRAGCOUNT': '1.000', 'weapon2': '1.058'} +[2023-09-14 14:39:56,359][63769] DAMAGECOUNT value on done: 504.0 +[2023-09-14 14:39:56,455][63806] DAMAGECOUNT value on done: 416.0 +[2023-09-14 14:39:56,506][63806] DAMAGECOUNT value on done: 316.0 +[2023-09-14 14:39:56,720][63769] DAMAGECOUNT value on done: 267.0 +[2023-09-14 14:39:56,864][63806] DAMAGECOUNT value on done: 597.0 +[2023-09-14 14:39:56,864][63806] Sum rewards: -6.710, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.580', 'AMMO5': '0.005', 'AMMO2': '0.018', 'HITCOUNT': '0.040', 'ARMOR': '0.056', 'AMMO4': '0.091', 'DAMAGECOUNT': '0.102', 'weapon4': '0.110', 'AMMO3': '0.118', 'WEAPON4': '0.200', 'weapon3': '0.638', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.592'} +[2023-09-14 14:39:57,466][63576] Saving new best policy, reward=-6.236! +[2023-09-14 14:39:58,650][63771] DAMAGECOUNT value on done: 517.0 +[2023-09-14 14:39:58,666][63734] DAMAGECOUNT value on done: 336.0 +[2023-09-14 14:39:58,837][63733] Updated weights for policy 1, policy_version 300 (0.0011) +[2023-09-14 14:39:59,050][63771] DAMAGECOUNT value on done: 402.0 +[2023-09-14 14:39:59,063][63734] DAMAGECOUNT value on done: 294.0 +[2023-09-14 14:39:59,063][63734] Sum rewards: -5.722, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.174', 'AMMO2': '0.006', 'AMMO5': '0.010', 'weapon5': '0.016', 'ARMOR': '0.028', 'AMMO4': '0.030', 'HITCOUNT': '0.070', 'AMMO3': '0.091', 'WEAPON4': '0.100', 'weapon4': '0.126', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.201', 'WEAPON3': '0.500', 'weapon3': '0.714', 'FRAGCOUNT': '1.000', 'weapon2': '1.410'} +[2023-09-14 14:39:59,134][63770] DAMAGECOUNT value on done: 241.0 +[2023-09-14 14:39:59,563][63770] DAMAGECOUNT value on done: 534.0 +[2023-09-14 14:40:01,235][63732] Updated weights for policy 0, policy_version 240 (0.0011) +[2023-09-14 14:40:01,649][63805] DAMAGECOUNT value on done: 495.0 +[2023-09-14 14:40:01,650][63805] Sum rewards: -4.256, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.045', 'AMMO5': '0.005', 'AMMO2': '0.021', 'WEAPON5': '0.050', 'ARMOR': '0.060', 'HITCOUNT': '0.060', 'weapon4': '0.062', 'AMMO3': '0.071', 'AMMO4': '0.106', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.180', 'WEAPON3': '0.350', 'weapon3': '0.422', 'FRAGCOUNT': '1.000', 'weapon2': '1.752'} +[2023-09-14 14:40:02,052][63805] DAMAGECOUNT value on done: 756.0 +[2023-09-14 14:40:02,053][63805] Sum rewards: -8.149, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.190', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.013', 'weapon4': '0.020', 'ARMOR': '0.048', 'AMMO4': '0.063', 'weapon5': '0.068', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'WEAPON5': '0.150', 'AMMO3': '0.184', 'DAMAGECOUNT': '0.480', 'weapon3': '0.802', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.286'} +[2023-09-14 14:40:04,909][63733] Updated weights for policy 1, policy_version 310 (0.0013) +[2023-09-14 14:40:08,537][63735] DAMAGECOUNT value on done: 524.0 +[2023-09-14 14:40:08,538][63735] Sum rewards: -3.630, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO5': '0.003', 'AMMO2': '0.013', 'weapon5': '0.022', 'WEAPON5': '0.050', 'weapon4': '0.052', 'AMMO4': '0.067', 'AMMO3': '0.084', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'HEALTH': '0.290', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.450', 'weapon3': '0.932', 'FRAGCOUNT': '1.000', 'weapon2': '1.082'} +[2023-09-14 14:40:08,879][63735] DAMAGECOUNT value on done: 367.0 +[2023-09-14 14:40:08,880][63735] Sum rewards: -4.753, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.262', 'AMMO5': '0.009', 'AMMO2': '0.026', 'ARMOR': '0.044', 'HITCOUNT': '0.050', 'weapon5': '0.050', 'weapon4': '0.052', 'AMMO3': '0.083', 'AMMO4': '0.130', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.240', 'WEAPON3': '0.400', 'weapon3': '0.786', 'FRAGCOUNT': '1.000', 'weapon2': '1.238'} +[2023-09-14 14:40:09,155][63767] Large shaping reward -2.549 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.3, -100.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 14:40:09,852][63767] DAMAGECOUNT value on done: 437.0 +[2023-09-14 14:40:10,008][63732] Updated weights for policy 0, policy_version 250 (0.0011) +[2023-09-14 14:40:10,235][63767] DAMAGECOUNT value on done: 627.0 +[2023-09-14 14:40:10,236][63767] Sum rewards: -11.783, reward structure: {'DEATHCOUNT': '-10.500', 'FRAGCOUNT': '-3.000', 'HEALTH': '-1.900', 'AMMO4': '-0.040', 'AMMO2': '-0.008', 'AMMO5': '0.007', 'weapon5': '0.014', 'ARMOR': '0.036', 'HITCOUNT': '0.080', 'WEAPON5': '0.150', 'AMMO3': '0.170', 'DAMAGECOUNT': '0.285', 'WEAPON3': '0.750', 'weapon3': '0.850', 'weapon2': '1.322'} +[2023-09-14 14:40:10,990][63733] Updated weights for policy 1, policy_version 320 (0.0013) +[2023-09-14 14:40:13,674][63805] DAMAGECOUNT value on done: 430.0 +[2023-09-14 14:40:14,061][63805] DAMAGECOUNT value on done: 538.0 +[2023-09-14 14:40:14,665][63734] DAMAGECOUNT value on done: 754.0 +[2023-09-14 14:40:14,666][63734] Sum rewards: 0.013, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.462', 'AMMO5': '0.003', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'weapon5': '0.038', 'weapon7': '0.042', 'WEAPON5': '0.050', 'ARMOR': '0.052', 'AMMO3': '0.070', 'HITCOUNT': '0.090', 'AMMO4': '0.092', 'WEAPON4': '0.150', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.228', 'WEAPON3': '0.400', 'weapon4': '0.420', 'weapon3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.032'} +[2023-09-14 14:40:14,719][63767] DAMAGECOUNT value on done: 716.0 +[2023-09-14 14:40:14,720][63767] Sum rewards: -0.510, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.439', 'AMMO2': '0.021', 'AMMO3': '0.092', 'AMMO4': '0.106', 'HITCOUNT': '0.120', 'WEAPON4': '0.200', 'weapon4': '0.212', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.450', 'weapon2': '1.034', 'weapon3': '1.128', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:40:15,015][63734] DAMAGECOUNT value on done: 505.0 +[2023-09-14 14:40:15,016][63734] Sum rewards: -6.053, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.688', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'AMMO2': '0.022', 'weapon5': '0.024', 'ARMOR': '0.060', 'HITCOUNT': '0.080', 'AMMO4': '0.109', 'WEAPON5': '0.150', 'AMMO3': '0.159', 'WEAPON4': '0.200', 'weapon4': '0.234', 'DAMAGECOUNT': '0.405', 'weapon3': '0.660', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.452'} +[2023-09-14 14:40:15,066][63767] DAMAGECOUNT value on done: 751.0 +[2023-09-14 14:40:15,066][63767] Sum rewards: -2.996, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.042', 'AMMO5': '0.010', 'AMMO2': '0.040', 'AMMO3': '0.078', 'HITCOUNT': '0.080', 'weapon5': '0.144', 'weapon4': '0.176', 'AMMO4': '0.198', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'weapon3': '0.298', 'WEAPON3': '0.400', 'ARMOR': '0.432', 'DAMAGECOUNT': '0.624', 'FRAGCOUNT': '1.000', 'weapon2': '1.366'} +[2023-09-14 14:40:15,876][63770] DAMAGECOUNT value on done: 279.0 +[2023-09-14 14:40:15,876][63770] Sum rewards: -4.207, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.430', 'AMMO5': '0.005', 'AMMO2': '0.011', 'weapon5': '0.018', 'WEAPON1': '0.020', 'HITCOUNT': '0.030', 'ARMOR': '0.040', 'AMMO4': '0.057', 'AMMO3': '0.072', 'DAMAGECOUNT': '0.072', 'WEAPON5': '0.100', 'weapon4': '0.136', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon3': '0.510', 'FRAGCOUNT': '1.000', 'weapon2': '1.302'} +[2023-09-14 14:40:15,931][63771] DAMAGECOUNT value on done: 298.0 +[2023-09-14 14:40:16,250][63771] DAMAGECOUNT value on done: 766.0 +[2023-09-14 14:40:16,252][63770] DAMAGECOUNT value on done: 370.0 +[2023-09-14 14:40:16,511][63769] DAMAGECOUNT value on done: 564.0 +[2023-09-14 14:40:16,843][63769] DAMAGECOUNT value on done: 489.0 +[2023-09-14 14:40:16,844][63769] Sum rewards: -6.617, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.900', 'AMMO5': '0.005', 'AMMO2': '0.019', 'weapon5': '0.040', 'HITCOUNT': '0.070', 'AMMO4': '0.092', 'WEAPON5': '0.100', 'AMMO3': '0.119', 'WEAPON4': '0.150', 'weapon4': '0.158', 'DAMAGECOUNT': '0.345', 'WEAPON3': '0.650', 'weapon3': '0.718', 'FRAGCOUNT': '1.000', 'weapon2': '1.568'} +[2023-09-14 14:40:17,059][63733] Updated weights for policy 1, policy_version 330 (0.0011) +[2023-09-14 14:40:17,468][63576] Saving new best policy, reward=-6.185! +[2023-09-14 14:40:18,824][63732] Updated weights for policy 0, policy_version 260 (0.0010) +[2023-09-14 14:40:19,598][63769] DAMAGECOUNT value on done: 549.0 +[2023-09-14 14:40:19,599][63769] Sum rewards: -5.427, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-0.500', 'HEALTH': '-0.076', 'AMMO5': '0.003', 'weapon5': '0.006', 'AMMO2': '0.020', 'WEAPON5': '0.050', 'HITCOUNT': '0.050', 'AMMO4': '0.098', 'AMMO3': '0.115', 'DAMAGECOUNT': '0.135', 'ARMOR': '0.400', 'WEAPON3': '0.650', 'weapon2': '1.156', 'weapon3': '1.466'} +[2023-09-14 14:40:19,928][63769] DAMAGECOUNT value on done: 295.0 +[2023-09-14 14:40:19,992][63735] DAMAGECOUNT value on done: 641.0 +[2023-09-14 14:40:19,993][63735] Sum rewards: 0.354, reward structure: {'DEATHCOUNT': '-3.750', 'HEALTH': '-0.090', 'AMMO4': '-0.021', 'AMMO2': '-0.004', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'ARMOR': '0.028', 'WEAPON5': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.080', 'WEAPON3': '0.250', 'DAMAGECOUNT': '0.357', 'weapon3': '0.974', 'FRAGCOUNT': '1.000', 'weapon2': '1.400'} +[2023-09-14 14:40:20,376][63735] DAMAGECOUNT value on done: 662.0 +[2023-09-14 14:40:20,377][63735] Sum rewards: -1.505, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.570', 'AMMO2': '0.008', 'AMMO5': '0.010', 'HITCOUNT': '0.040', 'AMMO4': '0.041', 'WEAPON4': '0.050', 'weapon4': '0.056', 'weapon5': '0.088', 'WEAPON5': '0.100', 'AMMO3': '0.104', 'WEAPON3': '0.350', 'ARMOR': '0.400', 'DAMAGECOUNT': '0.525', 'weapon3': '0.612', 'weapon2': '1.430', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:40:20,565][63806] DAMAGECOUNT value on done: 926.0 +[2023-09-14 14:40:20,566][63806] Sum rewards: -5.633, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.638', 'AMMO5': '0.005', 'weapon5': '0.008', 'AMMO2': '0.024', 'ARMOR': '0.076', 'weapon4': '0.080', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO4': '0.117', 'AMMO3': '0.120', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.550', 'weapon3': '0.610', 'FRAGCOUNT': '1.000', 'weapon2': '1.430'} +[2023-09-14 14:40:20,952][63806] DAMAGECOUNT value on done: 561.0 +[2023-09-14 14:40:20,952][63806] Sum rewards: -7.367, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.822', 'ARMOR': '0.010', 'AMMO2': '0.021', 'HITCOUNT': '0.100', 'AMMO4': '0.107', 'weapon4': '0.124', 'AMMO3': '0.148', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.435', 'weapon3': '0.552', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.408'} +[2023-09-14 14:40:20,998][63806] DAMAGECOUNT value on done: 406.0 +[2023-09-14 14:40:20,998][63806] Sum rewards: -3.244, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.744', 'weapon5': '0.002', 'AMMO5': '0.003', 'AMMO2': '0.027', 'WEAPON5': '0.050', 'ARMOR': '0.064', 'HITCOUNT': '0.070', 'AMMO3': '0.114', 'AMMO4': '0.132', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.270', 'weapon4': '0.402', 'WEAPON3': '0.650', 'weapon2': '0.970', 'weapon3': '0.996', 'FRAGCOUNT': '1.000'} +[2023-09-14 14:40:21,373][63806] DAMAGECOUNT value on done: 618.0 +[2023-09-14 14:40:21,374][63806] Sum rewards: -9.688, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-0.914', 'AMMO5': '0.003', 'HITCOUNT': '0.020', 'WEAPON1': '0.020', 'AMMO2': '0.021', 'ARMOR': '0.041', 'WEAPON5': '0.050', 'DAMAGECOUNT': '0.063', 'weapon4': '0.104', 'AMMO4': '0.106', 'AMMO3': '0.122', 'WEAPON4': '0.200', 'WEAPON3': '0.650', 'weapon3': '0.840', 'FRAGCOUNT': '1.000', 'weapon2': '1.486'} +[2023-09-14 14:40:22,461][63576] Saving new best policy, reward=-6.070! +[2023-09-14 14:40:23,181][63733] Updated weights for policy 1, policy_version 340 (0.0010) +[2023-09-14 14:40:23,517][63771] DAMAGECOUNT value on done: 587.0 +[2023-09-14 14:40:23,518][63771] Sum rewards: -10.440, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-3.190', 'AMMO2': '0.006', 'ARMOR': '0.032', 'AMMO4': '0.032', 'weapon4': '0.034', 'HITCOUNT': '0.080', 'WEAPON4': '0.100', 'AMMO3': '0.207', 'DAMAGECOUNT': '0.210', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon3': '1.022', 'weapon2': '1.126'} +[2023-09-14 14:40:23,546][63734] DAMAGECOUNT value on done: 486.0 +[2023-09-14 14:40:23,546][63734] Sum rewards: -7.179, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.364', 'AMMO5': '0.003', 'AMMO2': '0.010', 'WEAPON1': '0.020', 'HITCOUNT': '0.040', 'weapon4': '0.042', 'AMMO4': '0.052', 'WEAPON5': '0.100', 'weapon5': '0.106', 'AMMO3': '0.124', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.550', 'weapon3': '0.606', 'FRAGCOUNT': '1.000', 'weapon2': '1.432'} +[2023-09-14 14:40:23,900][63771] DAMAGECOUNT value on done: 472.0 +[2023-09-14 14:40:23,936][63734] DAMAGECOUNT value on done: 328.0 +[2023-09-14 14:40:23,937][63734] Sum rewards: -7.742, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.742', 'AMMO2': '0.017', 'HITCOUNT': '0.030', 'weapon4': '0.064', 'AMMO4': '0.083', 'AMMO3': '0.100', 'DAMAGECOUNT': '0.102', 'WEAPON4': '0.150', 'WEAPON3': '0.500', 'weapon3': '0.990', 'FRAGCOUNT': '1.000', 'weapon2': '1.464'} +[2023-09-14 14:40:24,152][63770] DAMAGECOUNT value on done: 257.0 +[2023-09-14 14:40:24,566][63770] DAMAGECOUNT value on done: 549.0 +[2023-09-14 14:40:26,554][63805] DAMAGECOUNT value on done: 529.0 +[2023-09-14 14:40:26,554][63805] Sum rewards: -9.187, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.190', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.007', 'AMMO2': '0.011', 'weapon5': '0.012', 'WEAPON1': '0.020', 'HITCOUNT': '0.030', 'weapon4': '0.036', 'ARMOR': '0.040', 'AMMO4': '0.054', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.102', 'AMMO3': '0.193', 'weapon3': '0.786', 'WEAPON3': '0.900', 'weapon2': '1.362'} +[2023-09-14 14:40:26,969][63805] DAMAGECOUNT value on done: 1022.0 +[2023-09-14 14:40:26,969][63805] Sum rewards: -3.183, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.892', 'AMMO5': '0.010', 'AMMO2': '0.014', 'ARMOR': '0.024', 'weapon5': '0.052', 'AMMO4': '0.071', 'WEAPON5': '0.100', 'AMMO3': '0.150', 'WEAPON4': '0.150', 'HITCOUNT': '0.170', 'weapon4': '0.288', 'DAMAGECOUNT': '0.798', 'WEAPON3': '0.850', 'weapon2': '0.952', 'weapon3': '1.080', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:40:27,465][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000269_1101824.pth... +[2023-09-14 14:40:27,518][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000347_1421312.pth... +[2023-09-14 14:40:27,574][63576] Saving new best policy, reward=-6.055! +[2023-09-14 14:40:27,770][63732] Updated weights for policy 0, policy_version 270 (0.0011) +[2023-09-14 14:40:29,360][63733] Updated weights for policy 1, policy_version 350 (0.0012) +[2023-09-14 14:40:30,529][63735] DAMAGECOUNT value on done: 575.0 +[2023-09-14 14:40:30,899][63735] DAMAGECOUNT value on done: 576.0 +[2023-09-14 14:40:30,899][63735] Sum rewards: -5.638, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.396', 'AMMO2': '0.017', 'ARMOR': '0.071', 'AMMO4': '0.083', 'weapon4': '0.086', 'AMMO3': '0.180', 'WEAPON4': '0.200', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.627', 'weapon3': '0.942', 'WEAPON3': '1.000', 'weapon2': '1.092', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:40:32,310][63767] DAMAGECOUNT value on done: 482.0 +[2023-09-14 14:40:32,310][63767] Sum rewards: -8.822, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.486', 'AMMO2': '0.021', 'HITCOUNT': '0.040', 'weapon4': '0.046', 'AMMO4': '0.103', 'ARMOR': '0.108', 'DAMAGECOUNT': '0.135', 'WEAPON4': '0.150', 'AMMO3': '0.203', 'weapon3': '0.624', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.284'} +[2023-09-14 14:40:32,623][63767] DAMAGECOUNT value on done: 682.0 +[2023-09-14 14:40:32,624][63767] Sum rewards: -6.076, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.830', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'AMMO5': '0.003', 'HITCOUNT': '0.050', 'AMMO3': '0.132', 'DAMAGECOUNT': '0.165', 'ARMOR': '0.487', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.096', 'weapon2': '1.152'} +[2023-09-14 14:40:35,054][63733] Updated weights for policy 1, policy_version 360 (0.0011) +[2023-09-14 14:40:37,053][63805] DAMAGECOUNT value on done: 455.0 +[2023-09-14 14:40:37,433][63805] DAMAGECOUNT value on done: 578.0 +[2023-09-14 14:40:37,595][63732] Updated weights for policy 0, policy_version 280 (0.0012) +[2023-09-14 14:40:37,985][63767] DAMAGECOUNT value on done: 931.0 +[2023-09-14 14:40:37,986][63767] Sum rewards: -2.765, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.392', 'AMMO5': '0.007', 'AMMO2': '0.009', 'ARMOR': '0.009', 'weapon5': '0.010', 'weapon4': '0.022', 'AMMO4': '0.042', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'AMMO3': '0.130', 'HITCOUNT': '0.130', 'DAMAGECOUNT': '0.645', 'WEAPON3': '0.750', 'weapon2': '0.920', 'weapon3': '1.552', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:40:38,284][63770] DAMAGECOUNT value on done: 299.0 +[2023-09-14 14:40:38,377][63734] DAMAGECOUNT value on done: 824.0 +[2023-09-14 14:40:38,383][63767] DAMAGECOUNT value on done: 830.0 +[2023-09-14 14:40:38,383][63767] Sum rewards: -5.861, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.986', 'AMMO2': '0.018', 'HITCOUNT': '0.070', 'ARMOR': '0.072', 'AMMO4': '0.087', 'AMMO3': '0.127', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.237', 'weapon4': '0.272', 'WEAPON3': '0.650', 'weapon3': '0.896', 'FRAGCOUNT': '1.000', 'weapon2': '1.246'} +[2023-09-14 14:40:38,639][63770] DAMAGECOUNT value on done: 396.0 +[2023-09-14 14:40:38,756][63734] DAMAGECOUNT value on done: 561.0 +[2023-09-14 14:40:38,757][63734] Sum rewards: -5.827, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.650', 'AMMO5': '0.004', 'AMMO2': '0.009', 'ARMOR': '0.035', 'weapon5': '0.038', 'AMMO4': '0.043', 'HITCOUNT': '0.050', 'AMMO3': '0.088', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.168', 'WEAPON4': '0.200', 'weapon4': '0.252', 'WEAPON3': '0.500', 'weapon3': '0.998', 'FRAGCOUNT': '1.000', 'weapon2': '1.338'} +[2023-09-14 14:40:39,462][63771] DAMAGECOUNT value on done: 408.0 +[2023-09-14 14:40:39,814][63771] DAMAGECOUNT value on done: 826.0 +[2023-09-14 14:40:39,814][63771] Sum rewards: -4.640, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.456', 'AMMO5': '0.005', 'AMMO2': '0.009', 'WEAPON1': '0.020', 'weapon5': '0.022', 'AMMO4': '0.045', 'HITCOUNT': '0.050', 'AMMO3': '0.091', 'WEAPON5': '0.100', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.180', 'weapon4': '0.206', 'ARMOR': '0.476', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.020', 'weapon2': '1.142'} +[2023-09-14 14:40:39,938][63769] DAMAGECOUNT value on done: 597.0 +[2023-09-14 14:40:40,342][63769] DAMAGECOUNT value on done: 509.0 +[2023-09-14 14:40:40,714][63733] Updated weights for policy 1, policy_version 370 (0.0013) +[2023-09-14 14:40:43,095][63769] DAMAGECOUNT value on done: 676.0 +[2023-09-14 14:40:43,096][63769] Sum rewards: -4.532, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.450', 'AMMO5': '0.003', 'weapon5': '0.004', 'WEAPON1': '0.010', 'AMMO2': '0.028', 'weapon4': '0.032', 'WEAPON5': '0.050', 'ARMOR': '0.055', 'AMMO3': '0.095', 'HITCOUNT': '0.120', 'AMMO4': '0.139', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.381', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.036', 'weapon2': '1.266'} +[2023-09-14 14:40:43,421][63769] DAMAGECOUNT value on done: 339.0 +[2023-09-14 14:40:44,410][63735] DAMAGECOUNT value on done: 696.0 +[2023-09-14 14:40:44,743][63735] DAMAGECOUNT value on done: 677.0 +[2023-09-14 14:40:45,183][63806] DAMAGECOUNT value on done: 926.0 +[2023-09-14 14:40:45,540][63806] DAMAGECOUNT value on done: 621.0 +[2023-09-14 14:40:45,583][63806] DAMAGECOUNT value on done: 472.0 +[2023-09-14 14:40:45,894][63806] DAMAGECOUNT value on done: 663.0 +[2023-09-14 14:40:46,785][63733] Updated weights for policy 1, policy_version 380 (0.0011) +[2023-09-14 14:40:46,871][63732] Updated weights for policy 0, policy_version 290 (0.0010) +[2023-09-14 14:40:47,466][63576] Saving new best policy, reward=-6.031! +[2023-09-14 14:40:48,580][63771] DAMAGECOUNT value on done: 692.0 +[2023-09-14 14:40:48,581][63771] Sum rewards: -5.147, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.171', 'AMMO2': '0.024', 'AMMO3': '0.092', 'HITCOUNT': '0.110', 'AMMO4': '0.120', 'weapon4': '0.142', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.315', 'ARMOR': '0.472', 'WEAPON3': '0.500', 'weapon3': '0.762', 'FRAGCOUNT': '1.000', 'weapon2': '1.186'} +[2023-09-14 14:40:48,894][63734] DAMAGECOUNT value on done: 511.0 +[2023-09-14 14:40:48,988][63771] DAMAGECOUNT value on done: 509.0 +[2023-09-14 14:40:49,222][63770] DAMAGECOUNT value on done: 257.0 +[2023-09-14 14:40:49,223][63770] Sum rewards: -9.235, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.799', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.007', 'AMMO2': '0.011', 'weapon5': '0.018', 'ARMOR': '0.044', 'weapon4': '0.050', 'AMMO4': '0.053', 'AMMO3': '0.127', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'weapon3': '0.598', 'WEAPON3': '0.600', 'weapon2': '1.256'} +[2023-09-14 14:40:49,317][63734] DAMAGECOUNT value on done: 578.0 +[2023-09-14 14:40:49,318][63734] Sum rewards: -4.419, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.060', 'weapon5': '0.002', 'AMMO5': '0.007', 'AMMO2': '0.015', 'weapon4': '0.072', 'AMMO4': '0.073', 'ARMOR': '0.090', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.150', 'AMMO3': '0.183', 'DAMAGECOUNT': '0.750', 'WEAPON3': '0.950', 'weapon2': '1.230', 'weapon3': '1.418', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:40:49,655][63770] DAMAGECOUNT value on done: 648.0 +[2023-09-14 14:40:51,529][63805] DAMAGECOUNT value on done: 550.0 +[2023-09-14 14:40:51,920][63805] DAMAGECOUNT value on done: 1059.0 +[2023-09-14 14:40:52,462][63576] Saving new best policy, reward=-6.015! +[2023-09-14 14:40:53,571][63735] DAMAGECOUNT value on done: 725.0 +[2023-09-14 14:40:53,572][63735] Sum rewards: -6.895, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.770', 'AMMO2': '0.007', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO4': '0.035', 'ARMOR': '0.044', 'weapon5': '0.044', 'HITCOUNT': '0.100', 'AMMO3': '0.136', 'WEAPON4': '0.150', 'weapon4': '0.172', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.134', 'weapon2': '1.282'} +[2023-09-14 14:40:53,894][63735] DAMAGECOUNT value on done: 736.0 +[2023-09-14 14:40:53,895][63735] Sum rewards: 0.413, reward structure: {'DEATHCOUNT': '-3.750', 'HEALTH': '-0.741', 'AMMO2': '0.015', 'ARMOR': '0.052', 'AMMO4': '0.076', 'AMMO3': '0.086', 'WEAPON4': '0.100', 'weapon4': '0.134', 'HITCOUNT': '0.160', 'DAMAGECOUNT': '0.480', 'WEAPON3': '0.500', 'weapon2': '0.852', 'FRAGCOUNT': '1.000', 'weapon3': '1.448'} +[2023-09-14 14:40:53,922][63732] Updated weights for policy 0, policy_version 300 (0.0012) +[2023-09-14 14:40:54,157][63733] Updated weights for policy 1, policy_version 390 (0.0010) +[2023-09-14 14:40:54,761][63767] DAMAGECOUNT value on done: 581.0 +[2023-09-14 14:40:55,086][63767] DAMAGECOUNT value on done: 740.0 +[2023-09-14 14:40:57,467][63576] Saving new best policy, reward=-5.934! +[2023-09-14 14:41:00,199][63732] Updated weights for policy 0, policy_version 310 (0.0012) +[2023-09-14 14:41:00,260][63805] DAMAGECOUNT value on done: 571.0 +[2023-09-14 14:41:00,656][63805] DAMAGECOUNT value on done: 733.0 +[2023-09-14 14:41:00,656][63805] Sum rewards: -4.640, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.746', 'AMMO5': '0.005', 'AMMO2': '0.005', 'weapon5': '0.018', 'AMMO4': '0.026', 'weapon4': '0.070', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.120', 'AMMO3': '0.140', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.600', 'weapon3': '0.854', 'weapon2': '1.602', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:41:00,884][63767] DAMAGECOUNT value on done: 1256.0 +[2023-09-14 14:41:00,884][63767] Sum rewards: -4.573, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.544', 'AMMO5': '0.003', 'AMMO2': '0.028', 'weapon5': '0.034', 'ARMOR': '0.037', 'WEAPON5': '0.050', 'weapon4': '0.092', 'AMMO3': '0.136', 'HITCOUNT': '0.140', 'AMMO4': '0.140', 'WEAPON4': '0.200', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.975', 'weapon2': '1.104', 'weapon3': '1.532'} +[2023-09-14 14:41:01,246][63767] DAMAGECOUNT value on done: 854.0 +[2023-09-14 14:41:01,247][63767] Sum rewards: -6.743, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.834', 'AMMO2': '0.007', 'AMMO5': '0.007', 'weapon5': '0.026', 'HITCOUNT': '0.030', 'AMMO4': '0.035', 'ARMOR': '0.052', 'DAMAGECOUNT': '0.072', 'WEAPON4': '0.100', 'AMMO3': '0.129', 'WEAPON5': '0.150', 'weapon4': '0.312', 'WEAPON3': '0.700', 'weapon2': '0.874', 'weapon3': '1.346'} +[2023-09-14 14:41:01,359][63770] DAMAGECOUNT value on done: 401.0 +[2023-09-14 14:41:01,359][63770] Sum rewards: -4.085, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.192', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'WEAPON4': '0.050', 'ARMOR': '0.052', 'weapon4': '0.072', 'HITCOUNT': '0.080', 'AMMO3': '0.140', 'DAMAGECOUNT': '0.306', 'WEAPON3': '0.650', 'weapon3': '0.664', 'weapon2': '1.344', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:41:01,737][63770] DAMAGECOUNT value on done: 491.0 +[2023-09-14 14:41:01,737][63770] Sum rewards: -6.156, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.020', 'AMMO4': '-0.021', 'AMMO2': '-0.004', 'AMMO5': '0.005', 'weapon5': '0.020', 'HITCOUNT': '0.090', 'WEAPON5': '0.100', 'AMMO3': '0.164', 'DAMAGECOUNT': '0.285', 'WEAPON3': '0.850', 'weapon3': '0.952', 'FRAGCOUNT': '1.000', 'weapon2': '1.424'} +[2023-09-14 14:41:02,365][63733] Updated weights for policy 1, policy_version 400 (0.0011) +[2023-09-14 14:41:02,461][63576] Saving new best policy, reward=-5.849! +[2023-09-14 14:41:02,696][63771] DAMAGECOUNT value on done: 538.0 +[2023-09-14 14:41:02,697][63771] Sum rewards: -4.509, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.420', 'AMMO2': '0.004', 'AMMO5': '0.010', 'weapon5': '0.010', 'AMMO4': '0.022', 'WEAPON4': '0.050', 'HITCOUNT': '0.080', 'WEAPON5': '0.100', 'weapon4': '0.108', 'AMMO3': '0.132', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.082', 'weapon3': '1.322'} +[2023-09-14 14:41:03,012][63771] DAMAGECOUNT value on done: 871.0 +[2023-09-14 14:41:03,317][63769] DAMAGECOUNT value on done: 627.0 +[2023-09-14 14:41:03,317][63769] Sum rewards: -8.132, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.500', 'AMMO5': '0.005', 'AMMO2': '0.026', 'HITCOUNT': '0.040', 'weapon5': '0.046', 'DAMAGECOUNT': '0.090', 'WEAPON5': '0.100', 'AMMO4': '0.130', 'AMMO3': '0.144', 'WEAPON3': '0.850', 'weapon2': '1.120', 'weapon3': '1.316'} +[2023-09-14 14:41:03,633][63769] DAMAGECOUNT value on done: 529.0 +[2023-09-14 14:41:03,634][63769] Sum rewards: -5.408, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.848', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'HITCOUNT': '0.020', 'AMMO2': '0.035', 'ARMOR': '0.040', 'weapon5': '0.040', 'DAMAGECOUNT': '0.060', 'WEAPON5': '0.100', 'AMMO3': '0.113', 'weapon4': '0.120', 'AMMO4': '0.177', 'WEAPON4': '0.200', 'WEAPON3': '0.600', 'weapon2': '0.850', 'weapon3': '1.320'} +[2023-09-14 14:41:03,717][63734] DAMAGECOUNT value on done: 960.0 +[2023-09-14 14:41:04,154][63734] DAMAGECOUNT value on done: 711.0 +[2023-09-14 14:41:06,590][63732] Updated weights for policy 0, policy_version 320 (0.0011) +[2023-09-14 14:41:07,467][63576] Saving new best policy, reward=-5.664! +[2023-09-14 14:41:07,652][63806] DAMAGECOUNT value on done: 983.0 +[2023-09-14 14:41:07,652][63806] Sum rewards: -8.018, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.654', 'WEAPON1': '0.010', 'AMMO2': '0.039', 'ARMOR': '0.046', 'HITCOUNT': '0.080', 'AMMO3': '0.108', 'weapon4': '0.138', 'DAMAGECOUNT': '0.171', 'AMMO4': '0.194', 'WEAPON4': '0.350', 'WEAPON3': '0.450', 'weapon3': '0.782', 'FRAGCOUNT': '1.000', 'weapon2': '1.268'} +[2023-09-14 14:41:07,995][63806] DAMAGECOUNT value on done: 721.0 +[2023-09-14 14:41:08,041][63806] DAMAGECOUNT value on done: 477.0 +[2023-09-14 14:41:08,075][63769] DAMAGECOUNT value on done: 876.0 +[2023-09-14 14:41:08,075][63769] Sum rewards: -0.375, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO2': '0.003', 'AMMO5': '0.005', 'ARMOR': '0.008', 'AMMO4': '0.013', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.097', 'WEAPON5': '0.100', 'weapon5': '0.138', 'HEALTH': '0.151', 'weapon4': '0.214', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.600', 'weapon3': '0.802', 'weapon2': '0.964', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:41:08,331][63806] DAMAGECOUNT value on done: 768.0 +[2023-09-14 14:41:08,427][63769] DAMAGECOUNT value on done: 468.0 +[2023-09-14 14:41:08,897][63735] DAMAGECOUNT value on done: 731.0 +[2023-09-14 14:41:09,293][63735] DAMAGECOUNT value on done: 817.0 +[2023-09-14 14:41:09,294][63735] Sum rewards: -5.902, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.572', 'AMMO4': '-0.010', 'AMMO2': '-0.002', 'AMMO5': '0.003', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'HITCOUNT': '0.130', 'AMMO3': '0.167', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.800', 'weapon2': '0.946', 'weapon3': '1.626', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:41:10,422][63733] Updated weights for policy 1, policy_version 410 (0.0011) +[2023-09-14 14:41:12,462][63576] Saving new best policy, reward=-5.599! +[2023-09-14 14:41:12,538][63770] DAMAGECOUNT value on done: 302.0 +[2023-09-14 14:41:12,671][63734] DAMAGECOUNT value on done: 640.0 +[2023-09-14 14:41:12,671][63734] Sum rewards: -7.568, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.380', 'AMMO5': '0.010', 'AMMO2': '0.016', 'ARMOR': '0.032', 'WEAPON1': '0.040', 'AMMO4': '0.080', 'weapon4': '0.090', 'HITCOUNT': '0.100', 'AMMO3': '0.127', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.387', 'WEAPON3': '0.700', 'weapon3': '0.910', 'FRAGCOUNT': '1.000', 'weapon2': '1.170'} +[2023-09-14 14:41:12,883][63732] Updated weights for policy 0, policy_version 330 (0.0010) +[2023-09-14 14:41:12,905][63770] DAMAGECOUNT value on done: 682.0 +[2023-09-14 14:41:13,062][63734] DAMAGECOUNT value on done: 693.0 +[2023-09-14 14:41:13,063][63734] Sum rewards: -2.003, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.250', 'AMMO5': '0.007', 'AMMO2': '0.011', 'WEAPON1': '0.020', 'weapon4': '0.022', 'weapon5': '0.034', 'AMMO4': '0.054', 'ARMOR': '0.076', 'AMMO3': '0.099', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.345', 'WEAPON3': '0.600', 'weapon2': '0.778', 'FRAGCOUNT': '1.000', 'weapon3': '1.150'} +[2023-09-14 14:41:13,629][63771] DAMAGECOUNT value on done: 947.0 +[2023-09-14 14:41:13,629][63771] Sum rewards: -2.109, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.370', 'AMMO2': '0.005', 'AMMO5': '0.010', 'AMMO4': '0.025', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'AMMO3': '0.123', 'HITCOUNT': '0.250', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.765', 'weapon2': '1.104', 'weapon3': '1.128', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:41:13,943][63771] DAMAGECOUNT value on done: 664.0 +[2023-09-14 14:41:13,944][63771] Sum rewards: -1.548, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.348', 'AMMO5': '0.005', 'weapon5': '0.024', 'ARMOR': '0.032', 'AMMO2': '0.033', 'AMMO3': '0.080', 'HITCOUNT': '0.090', 'WEAPON5': '0.100', 'AMMO4': '0.163', 'weapon4': '0.178', 'WEAPON4': '0.300', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.465', 'weapon3': '0.932', 'weapon2': '1.498', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:41:14,740][63805] DAMAGECOUNT value on done: 635.0 +[2023-09-14 14:41:15,122][63805] DAMAGECOUNT value on done: 1083.0 +[2023-09-14 14:41:15,123][63805] Sum rewards: -4.585, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.233', 'AMMO2': '0.003', 'AMMO4': '0.015', 'HITCOUNT': '0.030', 'ARMOR': '0.044', 'DAMAGECOUNT': '0.072', 'AMMO3': '0.106', 'WEAPON3': '0.500', 'weapon3': '0.672', 'FRAGCOUNT': '1.000', 'weapon2': '1.456'} +[2023-09-14 14:41:15,860][63735] DAMAGECOUNT value on done: 798.0 +[2023-09-14 14:41:16,247][63735] DAMAGECOUNT value on done: 856.0 +[2023-09-14 14:41:16,248][63735] Sum rewards: -5.727, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.122', 'AMMO2': '0.016', 'HITCOUNT': '0.060', 'AMMO4': '0.081', 'AMMO3': '0.115', 'WEAPON4': '0.200', 'weapon4': '0.292', 'DAMAGECOUNT': '0.360', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.228', 'weapon2': '1.242'} +[2023-09-14 14:41:17,705][63767] DAMAGECOUNT value on done: 749.0 +[2023-09-14 14:41:18,091][63767] DAMAGECOUNT value on done: 809.0 +[2023-09-14 14:41:18,091][63767] Sum rewards: -7.499, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.792', 'AMMO2': '0.011', 'ARMOR': '0.056', 'AMMO4': '0.056', 'HITCOUNT': '0.080', 'WEAPON4': '0.100', 'weapon4': '0.142', 'AMMO3': '0.188', 'DAMAGECOUNT': '0.207', 'weapon3': '0.500', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.452'} +[2023-09-14 14:41:18,415][63733] Updated weights for policy 1, policy_version 420 (0.0010) +[2023-09-14 14:41:19,197][63732] Updated weights for policy 0, policy_version 340 (0.0010) +[2023-09-14 14:41:22,901][63805] DAMAGECOUNT value on done: 611.0 +[2023-09-14 14:41:23,219][63805] DAMAGECOUNT value on done: 949.0 +[2023-09-14 14:41:23,220][63805] Sum rewards: -4.407, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.350', 'AMMO2': '0.018', 'weapon4': '0.038', 'weapon7': '0.064', 'AMMO4': '0.090', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'HITCOUNT': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.159', 'DAMAGECOUNT': '0.648', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon3': '1.260', 'weapon2': '1.316'} +[2023-09-14 14:41:23,461][63767] DAMAGECOUNT value on done: 1371.0 +[2023-09-14 14:41:23,462][63767] Sum rewards: -9.176, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-2.870', 'ARMOR': '0.004', 'AMMO5': '0.007', 'weapon5': '0.010', 'AMMO2': '0.027', 'HITCOUNT': '0.100', 'AMMO4': '0.136', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'AMMO3': '0.220', 'weapon4': '0.330', 'DAMAGECOUNT': '0.345', 'WEAPON3': '1.150', 'weapon2': '1.236', 'weapon3': '1.278', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:41:23,792][63767] DAMAGECOUNT value on done: 989.0 +[2023-09-14 14:41:24,390][63770] DAMAGECOUNT value on done: 521.0 +[2023-09-14 14:41:24,391][63770] Sum rewards: -3.436, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.742', 'AMMO5': '0.007', 'AMMO2': '0.009', 'ARMOR': '0.020', 'weapon4': '0.024', 'WEAPON1': '0.040', 'AMMO4': '0.044', 'HITCOUNT': '0.060', 'weapon5': '0.064', 'WEAPON4': '0.100', 'AMMO3': '0.106', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.360', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.108', 'weapon2': '1.114'} +[2023-09-14 14:41:24,745][63770] DAMAGECOUNT value on done: 591.0 +[2023-09-14 14:41:24,746][63770] Sum rewards: -4.710, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.870', 'weapon4': '0.002', 'AMMO2': '0.003', 'AMMO5': '0.009', 'HITCOUNT': '0.010', 'AMMO4': '0.013', 'weapon5': '0.038', 'ARMOR': '0.080', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.135', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.750', 'weapon3': '0.906', 'FRAGCOUNT': '1.000', 'weapon2': '1.214'} +[2023-09-14 14:41:25,489][63771] DAMAGECOUNT value on done: 538.0 +[2023-09-14 14:41:25,522][63732] Updated weights for policy 0, policy_version 350 (0.0011) +[2023-09-14 14:41:25,862][63771] DAMAGECOUNT value on done: 1016.0 +[2023-09-14 14:41:26,092][63769] DAMAGECOUNT value on done: 1033.0 +[2023-09-14 14:41:26,093][63769] Sum rewards: -2.619, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.680', 'AMMO2': '0.003', 'AMMO4': '0.014', 'AMMO3': '0.152', 'HITCOUNT': '0.240', 'weapon2': '0.904', 'WEAPON3': '0.950', 'DAMAGECOUNT': '1.218', 'weapon3': '2.080', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:41:26,432][63769] DAMAGECOUNT value on done: 564.0 +[2023-09-14 14:41:26,432][63769] Sum rewards: -7.240, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.240', 'AMMO5': '0.010', 'AMMO2': '0.030', 'HITCOUNT': '0.030', 'DAMAGECOUNT': '0.105', 'AMMO3': '0.118', 'AMMO4': '0.149', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'weapon4': '0.252', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.020', 'weapon2': '1.436'} +[2023-09-14 14:41:26,447][63733] Updated weights for policy 1, policy_version 430 (0.0012) +[2023-09-14 14:41:28,733][63734] DAMAGECOUNT value on done: 1180.0 +[2023-09-14 14:41:28,733][63734] Sum rewards: -2.780, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.233', 'AMMO2': '0.004', 'AMMO5': '0.012', 'AMMO4': '0.022', 'weapon5': '0.084', 'AMMO3': '0.103', 'HITCOUNT': '0.110', 'WEAPON5': '0.250', 'WEAPON3': '0.550', 'ARMOR': '0.562', 'DAMAGECOUNT': '0.660', 'weapon2': '1.028', 'weapon3': '1.068', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:41:29,129][63734] DAMAGECOUNT value on done: 841.0 +[2023-09-14 14:41:29,963][63806] DAMAGECOUNT value on done: 1013.0 +[2023-09-14 14:41:30,219][63806] DAMAGECOUNT value on done: 820.0 +[2023-09-14 14:41:30,256][63806] DAMAGECOUNT value on done: 626.0 +[2023-09-14 14:41:30,257][63806] Sum rewards: -2.513, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.318', 'AMMO5': '0.007', 'AMMO2': '0.011', 'weapon5': '0.034', 'ARMOR': '0.036', 'AMMO4': '0.056', 'AMMO3': '0.088', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.447', 'weapon3': '0.988', 'FRAGCOUNT': '1.000', 'weapon2': '1.138'} +[2023-09-14 14:41:30,593][63806] DAMAGECOUNT value on done: 873.0 +[2023-09-14 14:41:30,593][63806] Sum rewards: -6.500, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.050', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.011', 'AMMO2': '0.024', 'HITCOUNT': '0.050', 'ARMOR': '0.052', 'weapon4': '0.072', 'AMMO4': '0.120', 'AMMO3': '0.139', 'weapon5': '0.192', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.800', 'weapon3': '1.000', 'weapon2': '1.024'} +[2023-09-14 14:41:31,817][63732] Updated weights for policy 0, policy_version 360 (0.0011) +[2023-09-14 14:41:32,505][63454] Saving new best policy, reward=-6.314! +[2023-09-14 14:41:32,872][63769] DAMAGECOUNT value on done: 906.0 +[2023-09-14 14:41:33,218][63735] DAMAGECOUNT value on done: 740.0 +[2023-09-14 14:41:33,307][63769] DAMAGECOUNT value on done: 483.0 +[2023-09-14 14:41:33,536][63735] DAMAGECOUNT value on done: 917.0 +[2023-09-14 14:41:34,588][63733] Updated weights for policy 1, policy_version 440 (0.0010) +[2023-09-14 14:41:35,436][63770] DAMAGECOUNT value on done: 347.0 +[2023-09-14 14:41:35,437][63770] Sum rewards: -7.550, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.003', 'HITCOUNT': '0.010', 'AMMO2': '0.021', 'weapon5': '0.046', 'WEAPON5': '0.050', 'AMMO3': '0.098', 'AMMO4': '0.103', 'ARMOR': '0.114', 'DAMAGECOUNT': '0.135', 'weapon4': '0.170', 'WEAPON4': '0.200', 'HEALTH': '0.252', 'WEAPON3': '0.500', 'weapon3': '0.650', 'weapon2': '1.348'} +[2023-09-14 14:41:35,824][63770] DAMAGECOUNT value on done: 812.0 +[2023-09-14 14:41:36,129][63734] DAMAGECOUNT value on done: 640.0 +[2023-09-14 14:41:36,129][63734] Sum rewards: -5.132, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.005', 'AMMO2': '0.012', 'weapon5': '0.014', 'ARMOR': '0.048', 'WEAPON5': '0.050', 'AMMO4': '0.060', 'AMMO3': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.140', 'WEAPON3': '0.500', 'HEALTH': '0.721', 'weapon2': '1.048', 'weapon3': '1.070'} +[2023-09-14 14:41:36,524][63734] DAMAGECOUNT value on done: 738.0 +[2023-09-14 14:41:36,525][63734] Sum rewards: -5.306, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.310', 'AMMO5': '0.005', 'weapon5': '0.010', 'AMMO2': '0.016', 'HITCOUNT': '0.030', 'ARMOR': '0.032', 'AMMO3': '0.077', 'AMMO4': '0.081', 'weapon4': '0.096', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.135', 'WEAPON4': '0.200', 'WEAPON3': '0.450', 'weapon3': '0.908', 'FRAGCOUNT': '1.000', 'weapon2': '1.114'} +[2023-09-14 14:41:37,499][63454] Saving new best policy, reward=-6.120! +[2023-09-14 14:41:37,874][63805] DAMAGECOUNT value on done: 885.0 +[2023-09-14 14:41:37,874][63805] Sum rewards: -4.246, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.900', 'AMMO5': '0.005', 'AMMO2': '0.007', 'weapon5': '0.018', 'weapon4': '0.026', 'AMMO4': '0.037', 'WEAPON4': '0.050', 'ARMOR': '0.060', 'WEAPON5': '0.100', 'HITCOUNT': '0.130', 'AMMO3': '0.133', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.750', 'weapon2': '1.038', 'weapon3': '1.100', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:41:38,131][63732] Updated weights for policy 0, policy_version 370 (0.0011) +[2023-09-14 14:41:38,242][63735] DAMAGECOUNT value on done: 1038.0 +[2023-09-14 14:41:38,243][63735] Sum rewards: -2.999, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.082', 'AMMO2': '0.011', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'AMMO4': '0.056', 'AMMO3': '0.115', 'HITCOUNT': '0.190', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.720', 'weapon3': '1.004', 'weapon2': '1.504', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:41:38,245][63805] DAMAGECOUNT value on done: 1228.0 +[2023-09-14 14:41:38,245][63805] Sum rewards: -3.678, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.190', 'ARMOR': '0.004', 'AMMO5': '0.005', 'weapon4': '0.016', 'AMMO2': '0.019', 'weapon5': '0.020', 'WEAPON4': '0.050', 'AMMO4': '0.095', 'WEAPON5': '0.100', 'AMMO3': '0.102', 'HITCOUNT': '0.120', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.114', 'weapon2': '1.282'} +[2023-09-14 14:41:38,566][63771] DAMAGECOUNT value on done: 1069.0 +[2023-09-14 14:41:38,566][63771] Sum rewards: -2.054, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.856', 'AMMO2': '0.010', 'AMMO4': '0.052', 'AMMO3': '0.090', 'HITCOUNT': '0.100', 'ARMOR': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.114', 'DAMAGECOUNT': '0.366', 'WEAPON3': '0.550', 'weapon3': '0.944', 'FRAGCOUNT': '1.000', 'weapon2': '1.376'} +[2023-09-14 14:41:38,582][63735] DAMAGECOUNT value on done: 966.0 +[2023-09-14 14:41:38,583][63735] Sum rewards: -6.207, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.943', 'AMMO2': '0.014', 'weapon7': '0.020', 'HITCOUNT': '0.060', 'ARMOR': '0.064', 'AMMO4': '0.071', 'weapon4': '0.090', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.223', 'DAMAGECOUNT': '0.330', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050', 'weapon3': '1.184', 'weapon2': '1.480'} +[2023-09-14 14:41:39,006][63771] DAMAGECOUNT value on done: 704.0 +[2023-09-14 14:41:39,007][63771] Sum rewards: -5.376, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.078', 'AMMO2': '0.001', 'weapon5': '0.002', 'AMMO5': '0.003', 'AMMO4': '0.003', 'HITCOUNT': '0.030', 'ARMOR': '0.032', 'WEAPON5': '0.050', 'DAMAGECOUNT': '0.120', 'AMMO3': '0.150', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.024', 'weapon3': '1.438'} +[2023-09-14 14:41:40,851][63767] DAMAGECOUNT value on done: 758.0 +[2023-09-14 14:41:40,851][63767] Sum rewards: -8.112, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.263', 'AMMO5': '0.003', 'AMMO2': '0.006', 'ARMOR': '0.016', 'HITCOUNT': '0.020', 'DAMAGECOUNT': '0.027', 'WEAPON1': '0.030', 'AMMO4': '0.032', 'WEAPON5': '0.050', 'weapon4': '0.060', 'weapon5': '0.064', 'WEAPON4': '0.100', 'AMMO3': '0.144', 'WEAPON3': '0.800', 'weapon2': '1.090', 'weapon3': '1.208'} +[2023-09-14 14:41:41,194][63767] DAMAGECOUNT value on done: 883.0 +[2023-09-14 14:41:41,195][63767] Sum rewards: -3.778, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.112', 'AMMO5': '0.007', 'ARMOR': '0.012', 'weapon5': '0.016', 'AMMO2': '0.022', 'HITCOUNT': '0.060', 'AMMO4': '0.109', 'AMMO3': '0.116', 'WEAPON5': '0.150', 'weapon4': '0.182', 'DAMAGECOUNT': '0.222', 'WEAPON4': '0.250', 'WEAPON3': '0.650', 'weapon3': '0.912', 'FRAGCOUNT': '1.000', 'weapon2': '1.126'} +[2023-09-14 14:41:42,461][63454] Saving new best policy, reward=-6.004! +[2023-09-14 14:41:42,726][63733] Updated weights for policy 1, policy_version 450 (0.0011) +[2023-09-14 14:41:44,455][63732] Updated weights for policy 0, policy_version 380 (0.0012) +[2023-09-14 14:41:45,326][63805] DAMAGECOUNT value on done: 675.0 +[2023-09-14 14:41:45,326][63805] Sum rewards: -7.577, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.378', 'weapon5': '0.002', 'AMMO5': '0.003', 'AMMO2': '0.004', 'ARMOR': '0.020', 'AMMO4': '0.022', 'WEAPON5': '0.050', 'HITCOUNT': '0.090', 'WEAPON4': '0.150', 'AMMO3': '0.163', 'DAMAGECOUNT': '0.192', 'weapon4': '0.268', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.224', 'weapon3': '1.262'} +[2023-09-14 14:41:45,689][63805] DAMAGECOUNT value on done: 1034.0 +[2023-09-14 14:41:45,690][63805] Sum rewards: -7.195, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.088', 'AMMO2': '0.002', 'AMMO5': '0.003', 'AMMO4': '0.010', 'WEAPON1': '0.030', 'WEAPON5': '0.050', 'HITCOUNT': '0.080', 'weapon5': '0.096', 'AMMO3': '0.133', 'DAMAGECOUNT': '0.255', 'WEAPON3': '0.650', 'weapon3': '1.088', 'weapon2': '1.246'} +[2023-09-14 14:41:46,015][63767] DAMAGECOUNT value on done: 1493.0 +[2023-09-14 14:41:46,016][63767] Sum rewards: -8.856, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.233', 'AMMO2': '0.001', 'AMMO5': '0.003', 'AMMO4': '0.004', 'weapon4': '0.036', 'WEAPON4': '0.050', 'WEAPON5': '0.050', 'ARMOR': '0.056', 'HITCOUNT': '0.070', 'AMMO3': '0.185', 'DAMAGECOUNT': '0.366', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.186', 'weapon3': '1.470'} +[2023-09-14 14:41:46,366][63767] DAMAGECOUNT value on done: 1183.0 +[2023-09-14 14:41:46,366][63767] Sum rewards: -3.631, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-0.500', 'HEALTH': '-0.226', 'AMMO5': '0.003', 'AMMO2': '0.007', 'weapon5': '0.014', 'AMMO4': '0.037', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'ARMOR': '0.064', 'AMMO3': '0.068', 'HITCOUNT': '0.120', 'weapon4': '0.146', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.582', 'weapon2': '0.968', 'weapon3': '1.336'} +[2023-09-14 14:41:47,315][63770] DAMAGECOUNT value on done: 531.0 +[2023-09-14 14:41:47,465][63454] Saving new best policy, reward=-5.990! +[2023-09-14 14:41:47,704][63770] DAMAGECOUNT value on done: 646.0 +[2023-09-14 14:41:48,521][63771] DAMAGECOUNT value on done: 638.0 +[2023-09-14 14:41:48,872][63771] DAMAGECOUNT value on done: 1126.0 +[2023-09-14 14:41:48,872][63771] Sum rewards: -6.142, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.248', 'AMMO5': '0.005', 'AMMO2': '0.015', 'weapon4': '0.044', 'AMMO4': '0.076', 'ARMOR': '0.093', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.142', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.278', 'weapon3': '1.472'} +[2023-09-14 14:41:49,066][63769] DAMAGECOUNT value on done: 1117.0 +[2023-09-14 14:41:49,447][63769] DAMAGECOUNT value on done: 629.0 +[2023-09-14 14:41:49,448][63769] Sum rewards: -5.832, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.844', 'AMMO2': '0.007', 'AMMO4': '0.037', 'HITCOUNT': '0.060', 'ARMOR': '0.064', 'AMMO3': '0.149', 'DAMAGECOUNT': '0.195', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon3': '1.296', 'weapon2': '1.304'} +[2023-09-14 14:41:50,783][63732] Updated weights for policy 0, policy_version 390 (0.0010) +[2023-09-14 14:41:50,825][63733] Updated weights for policy 1, policy_version 460 (0.0012) +[2023-09-14 14:41:52,461][63454] Saving new best policy, reward=-5.909! +[2023-09-14 14:41:52,500][63806] DAMAGECOUNT value on done: 1038.0 +[2023-09-14 14:41:52,874][63806] DAMAGECOUNT value on done: 940.0 +[2023-09-14 14:41:52,923][63806] DAMAGECOUNT value on done: 646.0 +[2023-09-14 14:41:53,203][63806] DAMAGECOUNT value on done: 1038.0 +[2023-09-14 14:41:53,204][63806] Sum rewards: -1.778, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.958', 'AMMO5': '0.005', 'AMMO2': '0.008', 'AMMO4': '0.038', 'ARMOR': '0.040', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.116', 'WEAPON4': '0.150', 'weapon4': '0.234', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.012', 'weapon2': '1.232'} +[2023-09-14 14:41:53,761][63734] DAMAGECOUNT value on done: 1220.0 +[2023-09-14 14:41:54,218][63734] DAMAGECOUNT value on done: 976.0 +[2023-09-14 14:41:54,219][63734] Sum rewards: -4.631, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.744', 'AMMO4': '-0.031', 'AMMO2': '-0.006', 'weapon5': '0.014', 'AMMO5': '0.022', 'HITCOUNT': '0.080', 'AMMO3': '0.098', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.450', 'weapon3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.380'} +[2023-09-14 14:41:57,236][63732] Updated weights for policy 0, policy_version 400 (0.0011) +[2023-09-14 14:41:58,021][63735] DAMAGECOUNT value on done: 765.0 +[2023-09-14 14:41:58,063][63769] DAMAGECOUNT value on done: 956.0 +[2023-09-14 14:41:58,413][63735] DAMAGECOUNT value on done: 962.0 +[2023-09-14 14:41:58,485][63769] DAMAGECOUNT value on done: 593.0 +[2023-09-14 14:41:58,639][63770] DAMAGECOUNT value on done: 512.0 +[2023-09-14 14:41:58,639][63770] Sum rewards: -5.445, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.345', 'AMMO5': '0.003', 'AMMO2': '0.006', 'AMMO4': '0.028', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'weapon4': '0.116', 'AMMO3': '0.129', 'ARMOR': '0.486', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.700', 'weapon3': '0.972', 'FRAGCOUNT': '1.000', 'weapon2': '1.506'} +[2023-09-14 14:41:58,970][63770] DAMAGECOUNT value on done: 907.0 +[2023-09-14 14:41:58,971][63770] Sum rewards: -2.420, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.245', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.014', 'ARMOR': '0.032', 'weapon5': '0.064', 'AMMO4': '0.069', 'HITCOUNT': '0.090', 'AMMO3': '0.131', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'weapon4': '0.282', 'DAMAGECOUNT': '0.285', 'WEAPON3': '0.750', 'weapon3': '0.838', 'weapon2': '1.204', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:41:59,118][63733] Updated weights for policy 1, policy_version 470 (0.0011) +[2023-09-14 14:42:00,001][63734] DAMAGECOUNT value on done: 685.0 +[2023-09-14 14:42:00,343][63734] DAMAGECOUNT value on done: 753.0 +[2023-09-14 14:42:00,836][63735] DAMAGECOUNT value on done: 1228.0 +[2023-09-14 14:42:00,836][63735] Sum rewards: -5.979, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.159', 'AMMO5': '0.007', 'AMMO2': '0.009', 'ARMOR': '0.020', 'weapon5': '0.022', 'AMMO4': '0.044', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'AMMO3': '0.166', 'weapon4': '0.170', 'HITCOUNT': '0.200', 'DAMAGECOUNT': '0.570', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.112', 'weapon3': '1.310'} +[2023-09-14 14:42:00,979][63805] DAMAGECOUNT value on done: 920.0 +[2023-09-14 14:42:00,980][63805] Sum rewards: -3.990, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.390', 'AMMO5': '0.003', 'AMMO2': '0.018', 'weapon5': '0.020', 'HITCOUNT': '0.040', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'AMMO3': '0.085', 'AMMO4': '0.088', 'DAMAGECOUNT': '0.105', 'WEAPON4': '0.250', 'weapon4': '0.366', 'WEAPON3': '0.450', 'weapon3': '0.866', 'FRAGCOUNT': '1.000', 'weapon2': '1.270'} +[2023-09-14 14:42:01,216][63735] DAMAGECOUNT value on done: 1211.0 +[2023-09-14 14:42:01,217][63735] Sum rewards: -4.265, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.570', 'AMMO5': '0.005', 'AMMO2': '0.024', 'weapon5': '0.024', 'WEAPON5': '0.100', 'AMMO4': '0.118', 'AMMO3': '0.145', 'HITCOUNT': '0.160', 'WEAPON4': '0.200', 'weapon4': '0.320', 'ARMOR': '0.460', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.735', 'weapon3': '0.792', 'weapon2': '1.122', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:42:01,369][63805] DAMAGECOUNT value on done: 1238.0 +[2023-09-14 14:42:03,652][63732] Updated weights for policy 0, policy_version 410 (0.0011) +[2023-09-14 14:42:03,760][63771] DAMAGECOUNT value on done: 1140.0 +[2023-09-14 14:42:03,938][63767] DAMAGECOUNT value on done: 818.0 +[2023-09-14 14:42:04,145][63771] DAMAGECOUNT value on done: 965.0 +[2023-09-14 14:42:04,146][63771] Sum rewards: -1.629, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.434', 'weapon5': '0.002', 'AMMO5': '0.003', 'AMMO2': '0.005', 'AMMO4': '0.022', 'weapon4': '0.042', 'WEAPON5': '0.050', 'WEAPON4': '0.100', 'ARMOR': '0.114', 'AMMO3': '0.120', 'HITCOUNT': '0.190', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.783', 'weapon2': '1.188', 'weapon3': '1.536', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:42:04,326][63767] DAMAGECOUNT value on done: 1026.0 +[2023-09-14 14:42:07,190][63733] Updated weights for policy 1, policy_version 480 (0.0012) +[2023-09-14 14:42:07,959][63805] DAMAGECOUNT value on done: 756.0 +[2023-09-14 14:42:08,331][63805] DAMAGECOUNT value on done: 1144.0 +[2023-09-14 14:42:08,332][63805] Sum rewards: -1.709, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.290', 'weapon5': '0.006', 'ARMOR': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.017', 'WEAPON1': '0.020', 'HITCOUNT': '0.060', 'AMMO4': '0.085', 'AMMO3': '0.089', 'WEAPON4': '0.100', 'weapon4': '0.152', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.500', 'weapon2': '0.822', 'FRAGCOUNT': '1.000', 'weapon3': '1.432'} +[2023-09-14 14:42:08,528][63767] DAMAGECOUNT value on done: 1648.0 +[2023-09-14 14:42:08,921][63767] DAMAGECOUNT value on done: 1353.0 +[2023-09-14 14:42:10,113][63732] Updated weights for policy 0, policy_version 420 (0.0011) +[2023-09-14 14:42:10,762][63770] DAMAGECOUNT value on done: 701.0 +[2023-09-14 14:42:10,763][63770] Sum rewards: -2.160, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.112', 'AMMO2': '0.025', 'AMMO3': '0.105', 'AMMO4': '0.127', 'HITCOUNT': '0.150', 'WEAPON4': '0.300', 'weapon4': '0.386', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.600', 'ARMOR': '0.879', 'weapon3': '0.982', 'weapon2': '1.138', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:42:11,094][63770] DAMAGECOUNT value on done: 678.0 +[2023-09-14 14:42:11,632][63771] DAMAGECOUNT value on done: 753.0 +[2023-09-14 14:42:11,974][63771] DAMAGECOUNT value on done: 1161.0 +[2023-09-14 14:42:12,125][63769] DAMAGECOUNT value on done: 1227.0 +[2023-09-14 14:42:12,464][63769] DAMAGECOUNT value on done: 689.0 +[2023-09-14 14:42:15,268][63733] Updated weights for policy 1, policy_version 490 (0.0011) +[2023-09-14 14:42:15,411][63806] DAMAGECOUNT value on done: 1151.0 +[2023-09-14 14:42:15,412][63806] Sum rewards: -6.906, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.108', 'AMMO5': '0.010', 'AMMO2': '0.011', 'AMMO4': '0.053', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.201', 'DAMAGECOUNT': '0.309', 'weapon2': '0.960', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050', 'weapon3': '1.658'} +[2023-09-14 14:42:15,773][63806] DAMAGECOUNT value on done: 1140.0 +[2023-09-14 14:42:15,774][63806] Sum rewards: -4.436, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.382', 'AMMO5': '0.003', 'WEAPON1': '0.020', 'AMMO2': '0.025', 'WEAPON5': '0.050', 'weapon5': '0.052', 'ARMOR': '0.072', 'AMMO4': '0.123', 'HITCOUNT': '0.150', 'AMMO3': '0.166', 'WEAPON4': '0.200', 'weapon4': '0.214', 'DAMAGECOUNT': '0.600', 'weapon3': '0.882', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.240'} +[2023-09-14 14:42:15,818][63806] DAMAGECOUNT value on done: 646.0 +[2023-09-14 14:42:16,106][63806] DAMAGECOUNT value on done: 1089.0 +[2023-09-14 14:42:16,107][63806] Sum rewards: -8.801, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.957', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'WEAPON5': '0.050', 'HITCOUNT': '0.050', 'AMMO4': '0.055', 'weapon5': '0.076', 'AMMO3': '0.110', 'DAMAGECOUNT': '0.153', 'WEAPON3': '0.550', 'weapon3': '0.838', 'FRAGCOUNT': '1.000', 'weapon2': '1.500'} +[2023-09-14 14:42:16,319][63732] Updated weights for policy 0, policy_version 430 (0.0010) +[2023-09-14 14:42:19,071][63734] DAMAGECOUNT value on done: 1393.0 +[2023-09-14 14:42:19,071][63734] Sum rewards: -6.370, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.378', 'AMMO2': '0.007', 'AMMO5': '0.007', 'ARMOR': '0.016', 'WEAPON1': '0.020', 'AMMO4': '0.034', 'weapon5': '0.090', 'HITCOUNT': '0.140', 'AMMO3': '0.147', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.519', 'WEAPON3': '0.750', 'weapon2': '0.936', 'weapon3': '1.192'} +[2023-09-14 14:42:19,509][63734] DAMAGECOUNT value on done: 1234.0 +[2023-09-14 14:42:19,509][63734] Sum rewards: -4.263, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.735', 'AMMO2': '0.024', 'ARMOR': '0.072', 'AMMO3': '0.109', 'AMMO4': '0.121', 'WEAPON4': '0.150', 'HITCOUNT': '0.190', 'weapon4': '0.540', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.774', 'weapon3': '0.902', 'weapon2': '1.290', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:42:20,084][63805] Large shaping reward -2.603 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', 0.05, 10.0), ('AMMO2', 0.0012000000000000001, 6.0), ('WEAPON3', -0.05, -1.0), ('AMMO3', -0.008, -16.0), ('AMMO4', 0.006, 6.0), ('WEAPON5', -0.05, -1.0), ('AMMO5', -0.0025, -5.0), ('AMMO6', -0.1, -100.0), ('WEAPON7', -0.1, -1.0), ('AMMO7', -0.1, -100.0)] +[2023-09-14 14:42:21,684][63770] DAMAGECOUNT value on done: 562.0 +[2023-09-14 14:42:22,081][63770] DAMAGECOUNT value on done: 1242.0 +[2023-09-14 14:42:22,082][63770] Sum rewards: -1.495, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.149', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'WEAPON4': '0.050', 'AMMO4': '0.057', 'weapon4': '0.080', 'AMMO3': '0.099', 'weapon5': '0.124', 'WEAPON5': '0.200', 'HITCOUNT': '0.220', 'WEAPON3': '0.550', 'DAMAGECOUNT': '1.005', 'weapon2': '1.100', 'weapon3': '1.138', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:42:22,117][63735] DAMAGECOUNT value on done: 1005.0 +[2023-09-14 14:42:22,118][63735] Sum rewards: -8.036, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.758', 'AMMO5': '0.010', 'ARMOR': '0.010', 'weapon5': '0.020', 'AMMO2': '0.038', 'weapon4': '0.090', 'AMMO3': '0.152', 'AMMO4': '0.188', 'WEAPON5': '0.200', 'HITCOUNT': '0.230', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.720', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon3': '1.204', 'weapon2': '1.510'} +[2023-09-14 14:42:22,480][63735] DAMAGECOUNT value on done: 1092.0 +[2023-09-14 14:42:22,481][63735] Sum rewards: -3.107, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.436', 'AMMO5': '0.005', 'AMMO2': '0.010', 'weapon5': '0.012', 'ARMOR': '0.028', 'AMMO4': '0.052', 'AMMO3': '0.094', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'weapon4': '0.210', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.114', 'weapon3': '1.164'} +[2023-09-14 14:42:22,649][63732] Updated weights for policy 0, policy_version 440 (0.0010) +[2023-09-14 14:42:22,930][63735] DAMAGECOUNT value on done: 1324.0 +[2023-09-14 14:42:22,930][63735] Sum rewards: -7.234, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.333', 'AMMO2': '0.010', 'weapon5': '0.012', 'AMMO5': '0.014', 'AMMO4': '0.049', 'ARMOR': '0.064', 'HITCOUNT': '0.070', 'AMMO3': '0.113', 'WEAPON4': '0.200', 'weapon4': '0.266', 'DAMAGECOUNT': '0.288', 'WEAPON5': '0.300', 'WEAPON3': '0.700', 'weapon2': '0.958', 'weapon3': '1.554'} +[2023-09-14 14:42:23,035][63769] DAMAGECOUNT value on done: 1121.0 +[2023-09-14 14:42:23,035][63769] Sum rewards: 0.126, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.534', 'AMMO5': '0.005', 'AMMO2': '0.006', 'weapon5': '0.008', 'ARMOR': '0.028', 'AMMO4': '0.032', 'weapon7': '0.062', 'AMMO3': '0.097', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'HITCOUNT': '0.120', 'weapon4': '0.220', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.495', 'weapon2': '1.098', 'weapon3': '1.338', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:42:23,217][63733] Updated weights for policy 1, policy_version 500 (0.0012) +[2023-09-14 14:42:23,285][63735] DAMAGECOUNT value on done: 1523.0 +[2023-09-14 14:42:23,285][63735] Sum rewards: -1.863, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.876', 'WEAPON1': '0.020', 'AMMO2': '0.020', 'ARMOR': '0.080', 'AMMO4': '0.100', 'AMMO3': '0.132', 'weapon4': '0.134', 'WEAPON4': '0.200', 'HITCOUNT': '0.240', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.936', 'weapon3': '1.214', 'weapon2': '1.336', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:42:23,459][63769] DAMAGECOUNT value on done: 920.0 +[2023-09-14 14:42:23,460][63769] Sum rewards: -1.385, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.638', 'AMMO5': '0.007', 'AMMO2': '0.018', 'ARMOR': '0.032', 'weapon5': '0.048', 'weapon7': '0.090', 'AMMO4': '0.091', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'AMMO3': '0.197', 'HITCOUNT': '0.200', 'weapon4': '0.314', 'weapon3': '0.882', 'DAMAGECOUNT': '0.981', 'WEAPON3': '1.000', 'weapon2': '1.342', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:42:23,679][63734] DAMAGECOUNT value on done: 910.0 +[2023-09-14 14:42:23,680][63734] Sum rewards: -1.943, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.692', 'AMMO2': '0.009', 'AMMO5': '0.017', 'weapon5': '0.040', 'AMMO4': '0.042', 'ARMOR': '0.064', 'AMMO3': '0.110', 'weapon4': '0.122', 'WEAPON5': '0.150', 'HITCOUNT': '0.180', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.700', 'weapon2': '1.248', 'weapon3': '1.442', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:42:24,077][63734] DAMAGECOUNT value on done: 848.0 +[2023-09-14 14:42:24,078][63734] Sum rewards: -1.828, reward structure: {'DEATHCOUNT': '-5.250', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'AMMO2': '0.016', 'ARMOR': '0.025', 'weapon4': '0.038', 'HEALTH': '0.048', 'AMMO4': '0.078', 'HITCOUNT': '0.090', 'AMMO3': '0.091', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.124', 'DAMAGECOUNT': '0.285', 'WEAPON3': '0.450', 'weapon2': '1.208', 'weapon3': '1.264'} +[2023-09-14 14:42:24,133][63805] DAMAGECOUNT value on done: 1080.0 +[2023-09-14 14:42:24,134][63805] Sum rewards: -11.835, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.780', 'FRAGCOUNT': '-2.000', 'AMMO2': '0.005', 'AMMO5': '0.006', 'WEAPON1': '0.020', 'AMMO4': '0.026', 'ARMOR': '0.036', 'weapon4': '0.048', 'weapon5': '0.052', 'WEAPON4': '0.100', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'HITCOUNT': '0.120', 'WEAPON5': '0.150', 'AMMO3': '0.229', 'DAMAGECOUNT': '0.480', 'WEAPON3': '1.300', 'weapon3': '1.378', 'weapon2': '1.444'} +[2023-09-14 14:42:24,461][63805] DAMAGECOUNT value on done: 1385.0 +[2023-09-14 14:42:24,461][63805] Sum rewards: -5.140, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.630', 'WEAPON1': '0.010', 'AMMO5': '0.016', 'AMMO2': '0.026', 'ARMOR': '0.028', 'weapon5': '0.092', 'HITCOUNT': '0.110', 'AMMO3': '0.121', 'AMMO4': '0.132', 'WEAPON4': '0.250', 'WEAPON5': '0.250', 'weapon4': '0.394', 'DAMAGECOUNT': '0.441', 'WEAPON3': '0.650', 'weapon3': '0.938', 'weapon2': '1.282', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:42:26,748][63767] DAMAGECOUNT value on done: 937.0 +[2023-09-14 14:42:26,748][63767] Sum rewards: -0.674, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.244', 'AMMO5': '0.007', 'AMMO2': '0.027', 'weapon5': '0.032', 'HITCOUNT': '0.120', 'AMMO3': '0.127', 'AMMO4': '0.134', 'WEAPON5': '0.150', 'WEAPON4': '0.350', 'DAMAGECOUNT': '0.357', 'weapon4': '0.386', 'ARMOR': '0.448', 'WEAPON3': '0.700', 'weapon3': '0.748', 'weapon2': '1.484', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:42:27,133][63767] DAMAGECOUNT value on done: 1264.0 +[2023-09-14 14:42:27,133][63767] Sum rewards: -6.243, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.916', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO4': '0.049', 'WEAPON5': '0.050', 'weapon5': '0.092', 'AMMO3': '0.119', 'HITCOUNT': '0.170', 'WEAPON4': '0.250', 'weapon4': '0.390', 'ARMOR': '0.456', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.714', 'weapon3': '0.966', 'weapon2': '1.202'} +[2023-09-14 14:42:27,466][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000505_2068480.pth... +[2023-09-14 14:42:27,466][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000447_1830912.pth... +[2023-09-14 14:42:27,526][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000151_618496.pth +[2023-09-14 14:42:27,533][63576] Saving new best policy, reward=-5.477! +[2023-09-14 14:42:27,539][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000134_548864.pth +[2023-09-14 14:42:28,611][63771] DAMAGECOUNT value on done: 1205.0 +[2023-09-14 14:42:28,939][63732] Updated weights for policy 0, policy_version 450 (0.0010) +[2023-09-14 14:42:29,074][63771] DAMAGECOUNT value on done: 1316.0 +[2023-09-14 14:42:29,075][63771] Sum rewards: -2.872, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.170', 'AMMO2': '0.014', 'ARMOR': '0.044', 'AMMO4': '0.072', 'WEAPON4': '0.150', 'AMMO3': '0.197', 'weapon4': '0.200', 'HITCOUNT': '0.260', 'WEAPON3': '0.700', 'weapon3': '1.050', 'DAMAGECOUNT': '1.053', 'weapon2': '1.308', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:42:30,469][63805] DAMAGECOUNT value on done: 781.0 +[2023-09-14 14:42:30,731][63767] DAMAGECOUNT value on done: 1897.0 +[2023-09-14 14:42:30,732][63767] Sum rewards: -5.202, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.774', 'AMMO4': '-0.039', 'AMMO2': '-0.008', 'AMMO5': '0.003', 'AMMO3': '0.157', 'HITCOUNT': '0.180', 'DAMAGECOUNT': '0.747', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.348', 'weapon2': '1.384'} +[2023-09-14 14:42:30,794][63805] DAMAGECOUNT value on done: 1204.0 +[2023-09-14 14:42:30,794][63805] Sum rewards: -2.883, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.780', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'AMMO5': '0.003', 'weapon5': '0.036', 'WEAPON1': '0.040', 'WEAPON5': '0.050', 'AMMO3': '0.068', 'HITCOUNT': '0.070', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon7': '0.100', 'DAMAGECOUNT': '0.180', 'WEAPON3': '0.400', 'weapon2': '0.952', 'FRAGCOUNT': '1.000', 'weapon3': '1.462'} +[2023-09-14 14:42:31,061][63767] DAMAGECOUNT value on done: 1473.0 +[2023-09-14 14:42:31,201][63733] Updated weights for policy 1, policy_version 510 (0.0011) +[2023-09-14 14:42:32,462][63576] Saving new best policy, reward=-5.324! +[2023-09-14 14:42:33,661][63770] DAMAGECOUNT value on done: 756.0 +[2023-09-14 14:42:33,662][63770] Sum rewards: -9.677, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.970', 'AMMO5': '0.005', 'AMMO2': '0.005', 'ARMOR': '0.020', 'AMMO4': '0.026', 'HITCOUNT': '0.050', 'weapon4': '0.074', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.155', 'DAMAGECOUNT': '0.165', 'WEAPON3': '0.800', 'weapon3': '0.948', 'FRAGCOUNT': '1.000', 'weapon2': '1.594'} +[2023-09-14 14:42:34,038][63770] DAMAGECOUNT value on done: 941.0 +[2023-09-14 14:42:34,039][63770] Sum rewards: -1.617, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO2': '0.002', 'AMMO5': '0.007', 'AMMO4': '0.009', 'weapon5': '0.082', 'AMMO3': '0.130', 'WEAPON5': '0.150', 'HEALTH': '0.176', 'HITCOUNT': '0.180', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.789', 'FRAGCOUNT': '1.000', 'weapon2': '1.160', 'weapon3': '1.548'} +[2023-09-14 14:42:34,301][63771] DAMAGECOUNT value on done: 970.0 +[2023-09-14 14:42:34,301][63771] Sum rewards: -5.358, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.598', 'AMMO4': '-0.013', 'AMMO2': '-0.003', 'AMMO5': '0.005', 'weapon5': '0.016', 'WEAPON4': '0.050', 'WEAPON5': '0.050', 'ARMOR': '0.052', 'weapon4': '0.090', 'AMMO3': '0.095', 'HITCOUNT': '0.220', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.651', 'FRAGCOUNT': '1.000', 'weapon2': '1.228', 'weapon3': '1.348'} +[2023-09-14 14:42:34,688][63771] DAMAGECOUNT value on done: 1246.0 +[2023-09-14 14:42:34,901][63769] DAMAGECOUNT value on done: 1342.0 +[2023-09-14 14:42:34,901][63769] Sum rewards: -6.298, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.920', 'AMMO2': '0.002', 'AMMO5': '0.005', 'AMMO4': '0.008', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'HITCOUNT': '0.120', 'weapon4': '0.122', 'AMMO3': '0.158', 'DAMAGECOUNT': '0.345', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.010', 'weapon3': '1.670'} +[2023-09-14 14:42:35,278][63769] DAMAGECOUNT value on done: 748.0 +[2023-09-14 14:42:35,278][63769] Sum rewards: -1.147, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.980', 'AMMO5': '0.005', 'AMMO2': '0.008', 'WEAPON1': '0.020', 'AMMO4': '0.041', 'weapon5': '0.048', 'HITCOUNT': '0.050', 'AMMO3': '0.063', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.104', 'DAMAGECOUNT': '0.177', 'WEAPON3': '0.400', 'ARMOR': '0.472', 'FRAGCOUNT': '1.000', 'weapon3': '1.230', 'weapon2': '1.264'} +[2023-09-14 14:42:35,298][63732] Updated weights for policy 0, policy_version 460 (0.0011) +[2023-09-14 14:42:37,857][63806] DAMAGECOUNT value on done: 1299.0 +[2023-09-14 14:42:37,857][63806] Sum rewards: -7.312, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.190', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.012', 'AMMO5': '0.013', 'AMMO4': '0.062', 'ARMOR': '0.064', 'weapon5': '0.076', 'HITCOUNT': '0.120', 'weapon4': '0.170', 'AMMO3': '0.176', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.444', 'WEAPON3': '0.800', 'weapon3': '1.052', 'weapon2': '1.388'} +[2023-09-14 14:42:38,138][63806] DAMAGECOUNT value on done: 1440.0 +[2023-09-14 14:42:38,138][63806] Sum rewards: -3.615, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.870', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'AMMO2': '0.015', 'weapon7': '0.060', 'AMMO4': '0.074', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.100', 'AMMO3': '0.139', 'HITCOUNT': '0.160', 'weapon4': '0.172', 'WEAPON4': '0.200', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.900', 'weapon2': '1.130', 'weapon3': '1.250'} +[2023-09-14 14:42:38,184][63806] DAMAGECOUNT value on done: 813.0 +[2023-09-14 14:42:38,184][63806] Sum rewards: -3.809, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.172', 'AMMO5': '0.003', 'AMMO2': '0.009', 'ARMOR': '0.024', 'AMMO4': '0.044', 'WEAPON5': '0.050', 'AMMO3': '0.114', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.501', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.384', 'weapon2': '1.424'} +[2023-09-14 14:42:38,543][63806] DAMAGECOUNT value on done: 1173.0 +[2023-09-14 14:42:38,544][63806] Sum rewards: -11.490, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-2.946', 'AMMO5': '0.013', 'AMMO2': '0.015', 'ARMOR': '0.060', 'AMMO4': '0.072', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'weapon4': '0.116', 'AMMO3': '0.232', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.252', 'FRAGCOUNT': '1.000', 'weapon3': '1.082', 'WEAPON3': '1.150', 'weapon2': '1.274'} +[2023-09-14 14:42:39,354][63733] Updated weights for policy 1, policy_version 520 (0.0011) +[2023-09-14 14:42:41,599][63732] Updated weights for policy 0, policy_version 470 (0.0011) +[2023-09-14 14:42:44,383][63734] DAMAGECOUNT value on done: 1453.0 +[2023-09-14 14:42:44,383][63734] Sum rewards: -8.302, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.562', 'AMMO5': '0.004', 'weapon4': '0.012', 'AMMO2': '0.012', 'weapon5': '0.034', 'WEAPON4': '0.050', 'AMMO4': '0.061', 'HITCOUNT': '0.070', 'WEAPON5': '0.100', 'AMMO3': '0.158', 'DAMAGECOUNT': '0.180', 'ARMOR': '0.452', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.900', 'weapon2': '1.354', 'weapon3': '1.372'} +[2023-09-14 14:42:44,777][63770] DAMAGECOUNT value on done: 577.0 +[2023-09-14 14:42:44,794][63734] DAMAGECOUNT value on done: 1562.0 +[2023-09-14 14:42:44,795][63734] Sum rewards: -1.245, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.793', 'AMMO5': '0.005', 'weapon5': '0.010', 'AMMO2': '0.019', 'ARMOR': '0.036', 'AMMO4': '0.095', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.163', 'HITCOUNT': '0.220', 'weapon2': '0.696', 'DAMAGECOUNT': '0.984', 'WEAPON3': '1.000', 'weapon3': '1.870', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:42:45,014][63735] DAMAGECOUNT value on done: 1561.0 +[2023-09-14 14:42:45,014][63735] Sum rewards: -2.968, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.582', 'AMMO2': '0.008', 'AMMO4': '0.041', 'WEAPON4': '0.050', 'ARMOR': '0.116', 'AMMO3': '0.156', 'HITCOUNT': '0.170', 'weapon4': '0.290', 'DAMAGECOUNT': '0.711', 'WEAPON3': '0.800', 'weapon2': '0.990', 'weapon3': '1.282', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:42:45,101][63770] DAMAGECOUNT value on done: 1367.0 +[2023-09-14 14:42:45,102][63770] Sum rewards: -6.046, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.859', 'AMMO2': '0.002', 'AMMO4': '0.009', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'weapon4': '0.086', 'HITCOUNT': '0.110', 'AMMO3': '0.151', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.012', 'weapon3': '1.636'} +[2023-09-14 14:42:45,355][63735] DAMAGECOUNT value on done: 1623.0 +[2023-09-14 14:42:46,384][63735] DAMAGECOUNT value on done: 1055.0 +[2023-09-14 14:42:46,385][63735] Sum rewards: -5.626, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.330', 'AMMO5': '0.008', 'AMMO2': '0.009', 'WEAPON1': '0.020', 'HITCOUNT': '0.040', 'AMMO4': '0.043', 'weapon5': '0.044', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'weapon4': '0.100', 'AMMO3': '0.110', 'DAMAGECOUNT': '0.150', 'ARMOR': '0.509', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.044', 'weapon2': '1.578'} +[2023-09-14 14:42:46,769][63735] DAMAGECOUNT value on done: 1122.0 +[2023-09-14 14:42:46,769][63735] Sum rewards: -4.885, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.160', 'AMMO2': '0.026', 'HITCOUNT': '0.030', 'DAMAGECOUNT': '0.090', 'AMMO4': '0.128', 'AMMO3': '0.162', 'ARMOR': '0.441', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.066', 'weapon3': '1.782'} +[2023-09-14 14:42:47,359][63805] DAMAGECOUNT value on done: 1280.0 +[2023-09-14 14:42:47,360][63805] Sum rewards: -11.179, reward structure: {'DEATHCOUNT': '-14.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.835', 'AMMO5': '0.008', 'WEAPON1': '0.010', 'ARMOR': '0.016', 'AMMO2': '0.032', 'weapon5': '0.070', 'weapon4': '0.074', 'WEAPON5': '0.150', 'AMMO4': '0.162', 'AMMO3': '0.175', 'HITCOUNT': '0.190', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.600', 'WEAPON3': '0.950', 'weapon3': '1.174', 'weapon2': '1.494'} +[2023-09-14 14:42:47,431][63733] Updated weights for policy 1, policy_version 530 (0.0010) +[2023-09-14 14:42:47,540][63734] DAMAGECOUNT value on done: 940.0 +[2023-09-14 14:42:47,712][63805] DAMAGECOUNT value on done: 1645.0 +[2023-09-14 14:42:47,713][63805] Sum rewards: -7.892, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.710', 'AMMO5': '0.013', 'AMMO2': '0.024', 'WEAPON1': '0.030', 'weapon5': '0.046', 'AMMO3': '0.111', 'AMMO4': '0.120', 'HITCOUNT': '0.120', 'WEAPON5': '0.200', 'weapon4': '0.218', 'WEAPON4': '0.250', 'ARMOR': '0.445', 'WEAPON3': '0.600', 'weapon3': '0.648', 'DAMAGECOUNT': '0.780', 'FRAGCOUNT': '1.500', 'weapon2': '1.712'} +[2023-09-14 14:42:47,900][63734] DAMAGECOUNT value on done: 878.0 +[2023-09-14 14:42:47,900][63734] Sum rewards: -8.083, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-3.000', 'HEALTH': '-2.230', 'AMMO2': '0.020', 'WEAPON1': '0.020', 'HITCOUNT': '0.020', 'AMMO5': '0.021', 'DAMAGECOUNT': '0.090', 'AMMO4': '0.099', 'AMMO3': '0.119', 'weapon4': '0.120', 'weapon5': '0.138', 'WEAPON4': '0.300', 'WEAPON5': '0.350', 'ARMOR': '0.492', 'WEAPON3': '0.700', 'weapon3': '0.866', 'weapon2': '1.292'} +[2023-09-14 14:42:47,914][63769] DAMAGECOUNT value on done: 1161.0 +[2023-09-14 14:42:48,002][63732] Updated weights for policy 0, policy_version 480 (0.0012) +[2023-09-14 14:42:48,400][63769] DAMAGECOUNT value on done: 1030.0 +[2023-09-14 14:42:48,400][63769] Sum rewards: -5.927, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.814', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.007', 'AMMO2': '0.021', 'weapon5': '0.046', 'HITCOUNT': '0.100', 'AMMO4': '0.102', 'ARMOR': '0.116', 'WEAPON5': '0.150', 'AMMO3': '0.151', 'WEAPON4': '0.200', 'weapon4': '0.220', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.850', 'weapon2': '1.042', 'weapon3': '1.302'} +[2023-09-14 14:42:49,532][63767] DAMAGECOUNT value on done: 1012.0 +[2023-09-14 14:42:49,910][63767] DAMAGECOUNT value on done: 1309.0 +[2023-09-14 14:42:49,910][63767] Sum rewards: -5.008, reward structure: {'DEATHCOUNT': '-6.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.115', 'AMMO5': '0.007', 'AMMO2': '0.018', 'ARMOR': '0.040', 'HITCOUNT': '0.040', 'weapon5': '0.040', 'weapon4': '0.072', 'AMMO4': '0.088', 'AMMO3': '0.099', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.135', 'WEAPON5': '0.150', 'WEAPON3': '0.500', 'weapon2': '0.932', 'weapon3': '1.386'} +[2023-09-14 14:42:53,021][63767] DAMAGECOUNT value on done: 1980.0 +[2023-09-14 14:42:53,115][63805] DAMAGECOUNT value on done: 881.0 +[2023-09-14 14:42:53,115][63805] Sum rewards: -8.924, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.412', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.003', 'weapon4': '0.004', 'AMMO2': '0.016', 'ARMOR': '0.036', 'weapon6': '0.046', 'weapon5': '0.046', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.077', 'HITCOUNT': '0.090', 'AMMO3': '0.140', 'AMMO6': '0.198', 'AMMO7': '0.198', 'WEAPON6': '0.200', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.800', 'weapon3': '0.902', 'weapon2': '1.582'} +[2023-09-14 14:42:53,389][63767] DAMAGECOUNT value on done: 1618.0 +[2023-09-14 14:42:53,389][63767] Sum rewards: -4.987, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.807', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'weapon5': '0.006', 'AMMO2': '0.013', 'ARMOR': '0.032', 'AMMO4': '0.062', 'WEAPON5': '0.100', 'AMMO3': '0.137', 'HITCOUNT': '0.140', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.750', 'weapon2': '1.050', 'weapon3': '1.840'} +[2023-09-14 14:42:53,437][63805] DAMAGECOUNT value on done: 1269.0 +[2023-09-14 14:42:53,437][63805] Sum rewards: -10.534, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-2.222', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.019', 'ARMOR': '0.024', 'weapon4': '0.046', 'HITCOUNT': '0.070', 'AMMO4': '0.095', 'WEAPON5': '0.100', 'AMMO3': '0.134', 'DAMAGECOUNT': '0.195', 'WEAPON4': '0.200', 'WEAPON3': '0.650', 'weapon3': '0.808', 'FRAGCOUNT': '1.000', 'weapon2': '1.832'} +[2023-09-14 14:42:53,733][63771] DAMAGECOUNT value on done: 1246.0 +[2023-09-14 14:42:53,733][63771] Sum rewards: -10.158, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.575', 'FRAGCOUNT': '-1.500', 'AMMO2': '0.004', 'AMMO5': '0.010', 'weapon5': '0.018', 'AMMO4': '0.019', 'WEAPON1': '0.020', 'ARMOR': '0.040', 'HITCOUNT': '0.040', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.123', 'weapon4': '0.188', 'WEAPON5': '0.200', 'AMMO3': '0.220', 'weapon3': '1.066', 'WEAPON3': '1.100', 'weapon2': '1.270'} +[2023-09-14 14:42:54,108][63771] DAMAGECOUNT value on done: 1598.0 +[2023-09-14 14:42:54,109][63771] Sum rewards: -2.524, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.130', 'AMMO5': '0.005', 'AMMO2': '0.006', 'weapon5': '0.022', 'AMMO4': '0.031', 'ARMOR': '0.036', 'AMMO3': '0.098', 'WEAPON5': '0.100', 'WEAPON4': '0.200', 'HITCOUNT': '0.210', 'weapon4': '0.262', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.846', 'weapon3': '1.152', 'weapon2': '1.288', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:42:54,260][63732] Updated weights for policy 0, policy_version 490 (0.0010) +[2023-09-14 14:42:55,560][63733] Updated weights for policy 1, policy_version 540 (0.0010) +[2023-09-14 14:42:56,794][63770] DAMAGECOUNT value on done: 1111.0 +[2023-09-14 14:42:56,795][63770] Sum rewards: 2.252, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.460', 'AMMO5': '0.005', 'AMMO2': '0.024', 'weapon5': '0.044', 'ARMOR': '0.050', 'AMMO3': '0.092', 'WEAPON5': '0.100', 'AMMO4': '0.121', 'weapon4': '0.126', 'WEAPON4': '0.150', 'HITCOUNT': '0.310', 'WEAPON3': '0.550', 'weapon2': '1.032', 'DAMAGECOUNT': '1.065', 'weapon3': '1.542', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:42:57,125][63770] DAMAGECOUNT value on done: 976.0 +[2023-09-14 14:42:57,235][63771] DAMAGECOUNT value on done: 990.0 +[2023-09-14 14:42:57,236][63771] Sum rewards: -8.750, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.207', 'AMMO2': '0.002', 'AMMO5': '0.007', 'ARMOR': '0.008', 'AMMO4': '0.010', 'HITCOUNT': '0.020', 'weapon5': '0.052', 'DAMAGECOUNT': '0.060', 'WEAPON5': '0.100', 'AMMO3': '0.167', 'WEAPON3': '0.900', 'weapon2': '1.014', 'weapon3': '1.366'} +[2023-09-14 14:42:57,467][63454] Saving new best policy, reward=-5.809! +[2023-09-14 14:42:57,595][63771] DAMAGECOUNT value on done: 1276.0 +[2023-09-14 14:42:57,626][63769] DAMAGECOUNT value on done: 1511.0 +[2023-09-14 14:42:57,627][63769] Sum rewards: -1.433, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.222', 'AMMO5': '0.007', 'AMMO2': '0.010', 'WEAPON1': '0.020', 'weapon5': '0.030', 'AMMO4': '0.051', 'WEAPON5': '0.100', 'AMMO3': '0.111', 'HITCOUNT': '0.120', 'WEAPON4': '0.150', 'weapon4': '0.164', 'DAMAGECOUNT': '0.507', 'WEAPON3': '0.700', 'weapon2': '0.918', 'weapon3': '1.400', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:42:58,008][63769] DAMAGECOUNT value on done: 808.0 +[2023-09-14 14:43:00,159][63806] DAMAGECOUNT value on done: 1518.0 +[2023-09-14 14:43:00,159][63806] Sum rewards: -0.143, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.292', 'AMMO5': '0.010', 'weapon5': '0.012', 'AMMO2': '0.015', 'weapon4': '0.022', 'HITCOUNT': '0.060', 'AMMO4': '0.076', 'ARMOR': '0.084', 'weapon7': '0.084', 'AMMO3': '0.091', 'WEAPON5': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.657', 'weapon2': '1.250', 'weapon3': '1.448', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:43:00,462][63806] DAMAGECOUNT value on done: 1610.0 +[2023-09-14 14:43:00,463][63806] Sum rewards: -2.034, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.648', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'weapon5': '0.026', 'AMMO2': '0.026', 'HITCOUNT': '0.050', 'ARMOR': '0.072', 'weapon7': '0.078', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.128', 'AMMO4': '0.130', 'WEAPON4': '0.250', 'WEAPON5': '0.300', 'weapon4': '0.354', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.700', 'weapon3': '0.972', 'FRAGCOUNT': '1.000', 'weapon2': '1.182'} +[2023-09-14 14:43:00,507][63806] DAMAGECOUNT value on done: 922.0 +[2023-09-14 14:43:00,508][63806] Sum rewards: -9.072, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.950', 'AMMO2': '0.010', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.047', 'ARMOR': '0.076', 'weapon5': '0.082', 'WEAPON4': '0.100', 'weapon4': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.165', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.327', 'WEAPON3': '0.900', 'weapon2': '1.216', 'weapon3': '1.224', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:43:00,614][63732] Updated weights for policy 0, policy_version 500 (0.0010) +[2023-09-14 14:43:00,845][63806] DAMAGECOUNT value on done: 1368.0 +[2023-09-14 14:43:00,846][63806] Sum rewards: -4.365, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.480', 'AMMO5': '0.010', 'weapon5': '0.026', 'AMMO2': '0.034', 'weapon7': '0.058', 'AMMO3': '0.089', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'AMMO4': '0.169', 'WEAPON3': '0.400', 'WEAPON4': '0.450', 'weapon4': '0.486', 'DAMAGECOUNT': '0.585', 'weapon3': '0.616', 'weapon2': '1.432', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:43:02,461][63454] Saving new best policy, reward=-5.679! +[2023-09-14 14:43:03,694][63733] Updated weights for policy 1, policy_version 550 (0.0011) +[2023-09-14 14:43:07,007][63732] Updated weights for policy 0, policy_version 510 (0.0011) +[2023-09-14 14:43:07,364][63735] DAMAGECOUNT value on done: 1942.0 +[2023-09-14 14:43:07,365][63735] Sum rewards: -1.330, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.405', 'AMMO2': '0.010', 'AMMO5': '0.011', 'weapon5': '0.034', 'AMMO4': '0.048', 'WEAPON4': '0.050', 'ARMOR': '0.064', 'AMMO3': '0.091', 'weapon4': '0.116', 'HITCOUNT': '0.180', 'WEAPON5': '0.250', 'WEAPON3': '0.550', 'weapon2': '1.140', 'DAMAGECOUNT': '1.143', 'weapon3': '1.388', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:43:07,731][63735] DAMAGECOUNT value on done: 1750.0 +[2023-09-14 14:43:07,731][63735] Sum rewards: -6.211, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.038', 'AMMO5': '0.005', 'AMMO2': '0.032', 'HITCOUNT': '0.080', 'WEAPON5': '0.100', 'AMMO3': '0.150', 'AMMO4': '0.159', 'WEAPON4': '0.250', 'weapon4': '0.250', 'DAMAGECOUNT': '0.381', 'ARMOR': '0.488', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.236', 'weapon3': '1.246'} +[2023-09-14 14:43:07,956][63770] DAMAGECOUNT value on done: 622.0 +[2023-09-14 14:43:08,348][63770] DAMAGECOUNT value on done: 1517.0 +[2023-09-14 14:43:08,349][63770] Sum rewards: -3.183, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.524', 'AMMO2': '0.017', 'AMMO4': '0.083', 'AMMO3': '0.105', 'ARMOR': '0.108', 'HITCOUNT': '0.150', 'weapon4': '0.200', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.600', 'weapon3': '1.226', 'weapon2': '1.352', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:43:09,604][63734] DAMAGECOUNT value on done: 1487.0 +[2023-09-14 14:43:09,949][63734] DAMAGECOUNT value on done: 1614.0 +[2023-09-14 14:43:10,565][63805] DAMAGECOUNT value on done: 1325.0 +[2023-09-14 14:43:10,881][63735] DAMAGECOUNT value on done: 1085.0 +[2023-09-14 14:43:10,882][63735] Sum rewards: -6.424, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.720', 'AMMO5': '0.005', 'weapon5': '0.010', 'AMMO2': '0.024', 'HITCOUNT': '0.030', 'ARMOR': '0.040', 'AMMO3': '0.083', 'DAMAGECOUNT': '0.090', 'WEAPON5': '0.100', 'AMMO4': '0.120', 'WEAPON4': '0.250', 'weapon4': '0.394', 'WEAPON3': '0.450', 'weapon3': '0.846', 'FRAGCOUNT': '1.000', 'weapon2': '1.604'} +[2023-09-14 14:43:10,934][63805] DAMAGECOUNT value on done: 1890.0 +[2023-09-14 14:43:10,935][63805] Sum rewards: -4.485, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.904', 'AMMO5': '0.012', 'weapon5': '0.016', 'AMMO2': '0.026', 'weapon7': '0.064', 'ARMOR': '0.068', 'AMMO4': '0.128', 'weapon4': '0.130', 'AMMO3': '0.132', 'HITCOUNT': '0.150', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.735', 'WEAPON3': '0.800', 'weapon2': '1.256', 'weapon3': '1.432', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:43:11,063][63734] DAMAGECOUNT value on done: 1024.0 +[2023-09-14 14:43:11,064][63734] Sum rewards: -2.125, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO5': '0.008', 'AMMO2': '0.021', 'ARMOR': '0.036', 'AMMO3': '0.075', 'weapon5': '0.096', 'HITCOUNT': '0.100', 'AMMO4': '0.107', 'HEALTH': '0.138', 'WEAPON5': '0.150', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.252', 'WEAPON3': '0.400', 'weapon4': '0.468', 'FRAGCOUNT': '0.500', 'weapon3': '0.764', 'weapon2': '1.260'} +[2023-09-14 14:43:11,281][63735] DAMAGECOUNT value on done: 1176.0 +[2023-09-14 14:43:11,472][63734] DAMAGECOUNT value on done: 968.0 +[2023-09-14 14:43:11,473][63734] Sum rewards: -7.987, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.800', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.003', 'AMMO2': '0.009', 'WEAPON1': '0.010', 'AMMO4': '0.046', 'WEAPON5': '0.050', 'ARMOR': '0.052', 'weapon5': '0.062', 'HITCOUNT': '0.080', 'AMMO3': '0.115', 'WEAPON4': '0.150', 'weapon4': '0.210', 'DAMAGECOUNT': '0.270', 'WEAPON3': '0.650', 'weapon3': '0.652', 'weapon2': '1.704'} +[2023-09-14 14:43:11,773][63733] Updated weights for policy 1, policy_version 560 (0.0012) +[2023-09-14 14:43:12,461][63454] Saving new best policy, reward=-5.530! +[2023-09-14 14:43:12,608][63767] DAMAGECOUNT value on done: 1143.0 +[2023-09-14 14:43:12,609][63767] Sum rewards: -3.563, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.780', 'AMMO2': '0.011', 'AMMO5': '0.018', 'WEAPON1': '0.040', 'AMMO4': '0.057', 'weapon4': '0.062', 'ARMOR': '0.080', 'HITCOUNT': '0.100', 'weapon5': '0.100', 'AMMO3': '0.110', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.393', 'WEAPON5': '0.400', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.198', 'weapon3': '1.248'} +[2023-09-14 14:43:13,004][63767] DAMAGECOUNT value on done: 1314.0 +[2023-09-14 14:43:13,005][63767] Sum rewards: -6.913, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.643', 'AMMO5': '0.003', 'weapon5': '0.008', 'AMMO2': '0.009', 'HITCOUNT': '0.010', 'DAMAGECOUNT': '0.015', 'ARMOR': '0.040', 'AMMO4': '0.045', 'WEAPON5': '0.050', 'WEAPON4': '0.100', 'AMMO3': '0.106', 'weapon4': '0.180', 'WEAPON3': '0.450', 'weapon3': '0.884', 'weapon2': '1.580'} +[2023-09-14 14:43:13,192][63769] DAMAGECOUNT value on done: 1236.0 +[2023-09-14 14:43:13,356][63732] Updated weights for policy 0, policy_version 520 (0.0011) +[2023-09-14 14:43:13,624][63769] DAMAGECOUNT value on done: 1150.0 +[2023-09-14 14:43:13,624][63769] Sum rewards: -0.859, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.430', 'AMMO5': '0.003', 'HITCOUNT': '0.010', 'AMMO2': '0.020', 'WEAPON1': '0.020', 'ARMOR': '0.050', 'weapon5': '0.066', 'AMMO3': '0.079', 'AMMO4': '0.097', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.180', 'DAMAGECOUNT': '0.360', 'WEAPON3': '0.400', 'weapon3': '0.994', 'FRAGCOUNT': '1.000', 'weapon2': '1.342'} +[2023-09-14 14:43:15,604][63805] DAMAGECOUNT value on done: 1066.0 +[2023-09-14 14:43:15,605][63805] Sum rewards: -6.721, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.684', 'weapon5': '0.002', 'AMMO5': '0.005', 'ARMOR': '0.025', 'AMMO2': '0.026', 'WEAPON5': '0.100', 'AMMO4': '0.127', 'HITCOUNT': '0.150', 'AMMO3': '0.177', 'weapon4': '0.184', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.555', 'WEAPON3': '0.750', 'weapon2': '1.276', 'weapon3': '1.336', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:43:15,756][63767] DAMAGECOUNT value on done: 2015.0 +[2023-09-14 14:43:15,997][63805] DAMAGECOUNT value on done: 1499.0 +[2023-09-14 14:43:15,997][63805] Sum rewards: -6.193, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.295', 'AMMO4': '-0.006', 'AMMO2': '-0.001', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'ARMOR': '0.020', 'weapon5': '0.040', 'WEAPON4': '0.050', 'weapon4': '0.080', 'AMMO3': '0.092', 'HITCOUNT': '0.120', 'WEAPON5': '0.250', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.690', 'weapon3': '0.908', 'weapon2': '1.336', 'FRAGCOUNT': '1.500'} +[2023-09-14 14:43:16,125][63767] DAMAGECOUNT value on done: 1648.0 +[2023-09-14 14:43:16,126][63767] Sum rewards: -5.379, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.290', 'AMMO5': '0.003', 'AMMO2': '0.005', 'weapon5': '0.006', 'AMMO4': '0.027', 'HITCOUNT': '0.030', 'WEAPON5': '0.050', 'DAMAGECOUNT': '0.090', 'AMMO3': '0.160', 'WEAPON3': '0.800', 'weapon2': '0.870', 'FRAGCOUNT': '1.000', 'weapon3': '1.620'} +[2023-09-14 14:43:17,465][63454] Saving new best policy, reward=-5.486! +[2023-09-14 14:43:18,850][63771] DAMAGECOUNT value on done: 1276.0 +[2023-09-14 14:43:19,280][63771] DAMAGECOUNT value on done: 1886.0 +[2023-09-14 14:43:19,281][63771] Sum rewards: -7.162, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.760', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO4': '0.027', 'ARMOR': '0.032', 'weapon5': '0.044', 'WEAPON5': '0.100', 'HITCOUNT': '0.120', 'weapon4': '0.164', 'WEAPON4': '0.200', 'AMMO3': '0.203', 'DAMAGECOUNT': '0.864', 'WEAPON3': '1.050', 'weapon3': '1.340', 'weapon2': '1.444', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:43:19,644][63732] Updated weights for policy 0, policy_version 530 (0.0011) +[2023-09-14 14:43:19,767][63770] DAMAGECOUNT value on done: 1288.0 +[2023-09-14 14:43:19,957][63733] Updated weights for policy 1, policy_version 570 (0.0012) +[2023-09-14 14:43:20,080][63770] DAMAGECOUNT value on done: 1141.0 +[2023-09-14 14:43:20,344][63771] DAMAGECOUNT value on done: 1050.0 +[2023-09-14 14:43:20,344][63771] Sum rewards: -10.177, reward structure: {'DEATHCOUNT': '-11.250', 'FRAGCOUNT': '-2.000', 'HEALTH': '-0.968', 'AMMO5': '0.007', 'AMMO2': '0.010', 'HITCOUNT': '0.050', 'AMMO4': '0.051', 'weapon5': '0.070', 'WEAPON5': '0.150', 'AMMO3': '0.157', 'DAMAGECOUNT': '0.180', 'weapon2': '0.888', 'WEAPON3': '0.900', 'weapon3': '1.578'} +[2023-09-14 14:43:20,614][63769] DAMAGECOUNT value on done: 1671.0 +[2023-09-14 14:43:20,614][63769] Sum rewards: -6.698, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.390', 'AMMO2': '0.013', 'weapon4': '0.024', 'AMMO4': '0.065', 'AMMO3': '0.110', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.480', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.116', 'weapon2': '1.534'} +[2023-09-14 14:43:20,715][63771] DAMAGECOUNT value on done: 1326.0 +[2023-09-14 14:43:20,715][63771] Sum rewards: -4.602, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.840', 'AMMO4': '-0.024', 'AMMO2': '-0.005', 'HITCOUNT': '0.060', 'DAMAGECOUNT': '0.150', 'AMMO3': '0.183', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.182', 'weapon3': '1.442'} +[2023-09-14 14:43:20,991][63769] DAMAGECOUNT value on done: 951.0 +[2023-09-14 14:43:20,992][63769] Sum rewards: -6.496, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.094', 'AMMO2': '0.012', 'ARMOR': '0.052', 'AMMO4': '0.059', 'HITCOUNT': '0.090', 'AMMO3': '0.124', 'WEAPON4': '0.150', 'weapon4': '0.284', 'DAMAGECOUNT': '0.429', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.084', 'weapon3': '1.164'} +[2023-09-14 14:43:22,691][63806] DAMAGECOUNT value on done: 1533.0 +[2023-09-14 14:43:23,008][63806] DAMAGECOUNT value on done: 1883.0 +[2023-09-14 14:43:23,009][63806] Sum rewards: 1.081, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.777', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'AMMO5': '0.013', 'weapon4': '0.038', 'AMMO4': '0.053', 'weapon5': '0.054', 'AMMO3': '0.082', 'WEAPON4': '0.100', 'HITCOUNT': '0.150', 'WEAPON5': '0.250', 'WEAPON3': '0.450', 'ARMOR': '0.493', 'DAMAGECOUNT': '0.819', 'weapon2': '1.146', 'weapon3': '1.440', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:43:23,058][63806] DAMAGECOUNT value on done: 1042.0 +[2023-09-14 14:43:23,058][63806] Sum rewards: -2.259, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO5': '0.005', 'AMMO2': '0.008', 'WEAPON1': '0.010', 'ARMOR': '0.012', 'HEALTH': '0.018', 'AMMO4': '0.040', 'weapon5': '0.050', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.129', 'HITCOUNT': '0.130', 'weapon4': '0.194', 'DAMAGECOUNT': '0.360', 'WEAPON3': '0.600', 'weapon2': '0.908', 'FRAGCOUNT': '1.000', 'weapon3': '1.576'} +[2023-09-14 14:43:23,406][63806] DAMAGECOUNT value on done: 1418.0 +[2023-09-14 14:43:25,955][63732] Updated weights for policy 0, policy_version 540 (0.0010) +[2023-09-14 14:43:27,941][63733] Updated weights for policy 1, policy_version 580 (0.0012) +[2023-09-14 14:43:29,680][63735] DAMAGECOUNT value on done: 2047.0 +[2023-09-14 14:43:29,680][63735] Sum rewards: -5.926, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.514', 'AMMO5': '0.005', 'AMMO2': '0.038', 'ARMOR': '0.048', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.174', 'AMMO4': '0.192', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.315', 'weapon4': '0.426', 'WEAPON3': '0.850', 'weapon2': '0.918', 'weapon3': '1.412', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:43:30,005][63735] DAMAGECOUNT value on done: 1990.0 +[2023-09-14 14:43:30,006][63735] Sum rewards: -5.739, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.486', 'AMMO2': '0.002', 'AMMO5': '0.005', 'AMMO4': '0.011', 'weapon4': '0.022', 'ARMOR': '0.032', 'WEAPON4': '0.100', 'HITCOUNT': '0.170', 'AMMO3': '0.217', 'DAMAGECOUNT': '0.720', 'WEAPON3': '1.000', 'weapon2': '1.292', 'weapon3': '1.426', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:43:30,799][63770] DAMAGECOUNT value on done: 1104.0 +[2023-09-14 14:43:30,799][63770] Sum rewards: 1.594, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.596', 'WEAPON1': '0.010', 'AMMO5': '0.016', 'AMMO2': '0.017', 'ARMOR': '0.056', 'AMMO3': '0.083', 'AMMO4': '0.083', 'WEAPON4': '0.100', 'weapon4': '0.180', 'weapon5': '0.224', 'HITCOUNT': '0.260', 'WEAPON5': '0.350', 'WEAPON3': '0.450', 'weapon3': '0.864', 'DAMAGECOUNT': '1.446', 'weapon2': '1.550', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:43:31,171][63770] DAMAGECOUNT value on done: 1686.0 +[2023-09-14 14:43:31,172][63770] Sum rewards: -5.726, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.814', 'WEAPON1': '0.010', 'ARMOR': '0.024', 'AMMO2': '0.026', 'weapon4': '0.064', 'AMMO3': '0.111', 'AMMO4': '0.130', 'HITCOUNT': '0.150', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.507', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.178', 'weapon2': '1.538'} +[2023-09-14 14:43:32,222][63732] Updated weights for policy 0, policy_version 550 (0.0010) +[2023-09-14 14:43:32,461][63454] Saving new best policy, reward=-5.407! +[2023-09-14 14:43:33,731][63805] DAMAGECOUNT value on done: 1349.0 +[2023-09-14 14:43:33,732][63805] Sum rewards: -9.418, reward structure: {'DEATHCOUNT': '-11.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.074', 'AMMO2': '0.005', 'ARMOR': '0.016', 'AMMO5': '0.019', 'WEAPON1': '0.020', 'AMMO4': '0.026', 'HITCOUNT': '0.040', 'WEAPON4': '0.050', 'weapon4': '0.060', 'DAMAGECOUNT': '0.072', 'weapon5': '0.082', 'AMMO3': '0.167', 'WEAPON5': '0.350', 'WEAPON3': '0.800', 'weapon3': '1.156', 'weapon2': '1.542'} +[2023-09-14 14:43:34,079][63805] DAMAGECOUNT value on done: 2070.0 +[2023-09-14 14:43:34,751][63734] DAMAGECOUNT value on done: 1139.0 +[2023-09-14 14:43:34,751][63734] Sum rewards: -6.380, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.398', 'AMMO4': '-0.027', 'AMMO2': '-0.005', 'WEAPON1': '0.010', 'AMMO5': '0.024', 'HITCOUNT': '0.080', 'weapon5': '0.100', 'AMMO3': '0.133', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.345', 'WEAPON3': '0.700', 'ARMOR': '0.908', 'weapon2': '1.278', 'weapon3': '1.672'} +[2023-09-14 14:43:34,842][63734] DAMAGECOUNT value on done: 1754.0 +[2023-09-14 14:43:34,843][63734] Sum rewards: -4.059, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.480', 'AMMO5': '0.003', 'AMMO2': '0.035', 'WEAPON5': '0.050', 'ARMOR': '0.060', 'AMMO3': '0.117', 'AMMO4': '0.177', 'HITCOUNT': '0.200', 'weapon4': '0.438', 'WEAPON4': '0.450', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.801', 'weapon3': '0.996', 'weapon2': '1.444', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:43:35,124][63735] DAMAGECOUNT value on done: 1164.0 +[2023-09-14 14:43:35,125][63735] Sum rewards: -3.542, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.672', 'AMMO5': '0.015', 'AMMO2': '0.025', 'HITCOUNT': '0.060', 'ARMOR': '0.064', 'WEAPON5': '0.100', 'AMMO3': '0.111', 'AMMO4': '0.124', 'DAMAGECOUNT': '0.237', 'WEAPON4': '0.400', 'weapon4': '0.438', 'WEAPON3': '0.600', 'weapon3': '0.704', 'FRAGCOUNT': '1.000', 'weapon2': '1.752'} +[2023-09-14 14:43:35,156][63734] DAMAGECOUNT value on done: 1355.0 +[2023-09-14 14:43:35,157][63734] Sum rewards: -0.758, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.277', 'AMMO5': '0.003', 'ARMOR': '0.004', 'AMMO2': '0.008', 'AMMO4': '0.039', 'weapon4': '0.042', 'WEAPON5': '0.050', 'weapon7': '0.054', 'AMMO3': '0.096', 'WEAPON4': '0.150', 'AMMO6': '0.160', 'AMMO7': '0.160', 'HITCOUNT': '0.190', 'WEAPON7': '0.200', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.125', 'weapon3': '1.298', 'weapon2': '1.340'} +[2023-09-14 14:43:35,264][63734] DAMAGECOUNT value on done: 1767.0 +[2023-09-14 14:43:35,264][63734] Sum rewards: -4.062, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.060', 'AMMO4': '-0.029', 'AMMO2': '-0.006', 'AMMO5': '0.005', 'ARMOR': '0.040', 'WEAPON5': '0.100', 'HITCOUNT': '0.140', 'AMMO3': '0.165', 'DAMAGECOUNT': '0.459', 'WEAPON3': '0.800', 'weapon2': '1.074', 'weapon3': '1.500', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:43:35,573][63767] DAMAGECOUNT value on done: 1335.0 +[2023-09-14 14:43:35,574][63767] Sum rewards: -4.298, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.036', 'AMMO5': '0.009', 'AMMO2': '0.020', 'WEAPON1': '0.040', 'weapon5': '0.088', 'WEAPON5': '0.100', 'AMMO4': '0.100', 'AMMO3': '0.123', 'HITCOUNT': '0.150', 'weapon4': '0.202', 'WEAPON4': '0.300', 'ARMOR': '0.404', 'DAMAGECOUNT': '0.576', 'WEAPON3': '0.700', 'weapon3': '0.788', 'weapon2': '1.888', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:43:35,574][63735] DAMAGECOUNT value on done: 1335.0 +[2023-09-14 14:43:35,575][63735] Sum rewards: -3.408, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.069', 'AMMO2': '0.007', 'ARMOR': '0.028', 'AMMO4': '0.037', 'weapon4': '0.096', 'WEAPON4': '0.100', 'AMMO3': '0.126', 'HITCOUNT': '0.140', 'DAMAGECOUNT': '0.477', 'WEAPON3': '0.650', 'weapon2': '0.964', 'FRAGCOUNT': '1.000', 'weapon3': '1.536'} +[2023-09-14 14:43:35,908][63767] DAMAGECOUNT value on done: 1498.0 +[2023-09-14 14:43:35,909][63767] Sum rewards: -4.694, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.683', 'AMMO2': '0.004', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.020', 'ARMOR': '0.028', 'weapon5': '0.058', 'HITCOUNT': '0.140', 'AMMO3': '0.173', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.552', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.292', 'weapon3': '1.486'} +[2023-09-14 14:43:36,072][63733] Updated weights for policy 1, policy_version 590 (0.0011) +[2023-09-14 14:43:37,466][63454] Saving new best policy, reward=-5.311! +[2023-09-14 14:43:38,145][63767] DAMAGECOUNT value on done: 2144.0 +[2023-09-14 14:43:38,145][63767] Sum rewards: -2.630, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.080', 'AMMO5': '0.003', 'AMMO2': '0.003', 'weapon5': '0.006', 'ARMOR': '0.008', 'AMMO4': '0.015', 'WEAPON5': '0.050', 'HITCOUNT': '0.110', 'AMMO3': '0.138', 'DAMAGECOUNT': '0.387', 'WEAPON3': '0.800', 'weapon2': '0.886', 'weapon3': '1.544', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:43:38,332][63769] DAMAGECOUNT value on done: 1326.0 +[2023-09-14 14:43:38,333][63769] Sum rewards: -3.458, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.552', 'AMMO2': '0.020', 'HITCOUNT': '0.080', 'ARMOR': '0.088', 'WEAPON4': '0.100', 'AMMO4': '0.101', 'AMMO3': '0.119', 'DAMAGECOUNT': '0.270', 'weapon4': '0.352', 'WEAPON3': '0.700', 'weapon3': '0.838', 'FRAGCOUNT': '1.000', 'weapon2': '1.176'} +[2023-09-14 14:43:38,396][63805] DAMAGECOUNT value on done: 1131.0 +[2023-09-14 14:43:38,537][63767] DAMAGECOUNT value on done: 1707.0 +[2023-09-14 14:43:38,632][63732] Updated weights for policy 0, policy_version 560 (0.0010) +[2023-09-14 14:43:38,768][63805] DAMAGECOUNT value on done: 1519.0 +[2023-09-14 14:43:38,784][63769] DAMAGECOUNT value on done: 1258.0 +[2023-09-14 14:43:42,461][63454] Saving new best policy, reward=-5.292! +[2023-09-14 14:43:42,667][63770] DAMAGECOUNT value on done: 1408.0 +[2023-09-14 14:43:43,038][63770] DAMAGECOUNT value on done: 1221.0 +[2023-09-14 14:43:43,045][63771] DAMAGECOUNT value on done: 1070.0 +[2023-09-14 14:43:43,425][63771] DAMAGECOUNT value on done: 1340.0 +[2023-09-14 14:43:43,701][63771] DAMAGECOUNT value on done: 1415.0 +[2023-09-14 14:43:43,753][63769] DAMAGECOUNT value on done: 1771.0 +[2023-09-14 14:43:44,034][63771] DAMAGECOUNT value on done: 2066.0 +[2023-09-14 14:43:44,035][63771] Sum rewards: -3.717, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.804', 'AMMO2': '0.015', 'ARMOR': '0.052', 'AMMO4': '0.074', 'weapon4': '0.098', 'WEAPON4': '0.100', 'HITCOUNT': '0.140', 'AMMO3': '0.196', 'DAMAGECOUNT': '0.540', 'weapon2': '1.060', 'WEAPON3': '1.100', 'weapon3': '1.462', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:43:44,107][63733] Updated weights for policy 1, policy_version 600 (0.0010) +[2023-09-14 14:43:44,136][63769] DAMAGECOUNT value on done: 1141.0 +[2023-09-14 14:43:44,136][63769] Sum rewards: -5.166, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.885', 'AMMO4': '-0.020', 'AMMO2': '-0.004', 'weapon5': '0.004', 'AMMO5': '0.010', 'ARMOR': '0.032', 'WEAPON5': '0.100', 'HITCOUNT': '0.140', 'AMMO3': '0.165', 'DAMAGECOUNT': '0.570', 'WEAPON3': '0.850', 'weapon2': '1.288', 'weapon3': '1.334', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:43:44,925][63732] Updated weights for policy 0, policy_version 570 (0.0010) +[2023-09-14 14:43:45,106][63806] DAMAGECOUNT value on done: 1738.0 +[2023-09-14 14:43:45,106][63806] Sum rewards: -0.396, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.771', 'WEAPON1': '0.010', 'AMMO5': '0.018', 'AMMO2': '0.028', 'weapon7': '0.032', 'ARMOR': '0.072', 'weapon4': '0.084', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'weapon5': '0.102', 'AMMO3': '0.122', 'AMMO4': '0.140', 'HITCOUNT': '0.180', 'WEAPON5': '0.250', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.615', 'WEAPON3': '0.700', 'weapon3': '1.290', 'weapon2': '1.382', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:43:45,401][63806] DAMAGECOUNT value on done: 1971.0 +[2023-09-14 14:43:45,402][63806] Sum rewards: -10.115, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-3.288', 'AMMO2': '0.020', 'AMMO5': '0.020', 'HITCOUNT': '0.030', 'WEAPON1': '0.040', 'weapon4': '0.084', 'AMMO4': '0.099', 'weapon5': '0.114', 'AMMO3': '0.202', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.264', 'WEAPON5': '0.300', 'ARMOR': '0.436', 'FRAGCOUNT': '1.000', 'weapon3': '1.066', 'WEAPON3': '1.150', 'weapon2': '1.598'} +[2023-09-14 14:43:45,479][63806] DAMAGECOUNT value on done: 1135.0 +[2023-09-14 14:43:45,480][63806] Sum rewards: -10.285, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.628', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.012', 'AMMO2': '0.013', 'AMMO4': '0.066', 'HITCOUNT': '0.100', 'weapon5': '0.138', 'AMMO3': '0.143', 'DAMAGECOUNT': '0.279', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon4': '0.358', 'ARMOR': '0.447', 'WEAPON3': '0.800', 'weapon3': '1.090', 'weapon2': '1.546'} +[2023-09-14 14:43:45,783][63806] DAMAGECOUNT value on done: 1558.0 +[2023-09-14 14:43:51,180][63732] Updated weights for policy 0, policy_version 580 (0.0011) +[2023-09-14 14:43:51,839][63735] DAMAGECOUNT value on done: 2092.0 +[2023-09-14 14:43:51,839][63735] Sum rewards: -9.337, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.140', 'AMMO2': '0.023', 'ARMOR': '0.068', 'HITCOUNT': '0.070', 'AMMO4': '0.113', 'DAMAGECOUNT': '0.135', 'AMMO3': '0.180', 'weapon4': '0.202', 'WEAPON4': '0.250', 'WEAPON3': '0.750', 'weapon3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.112'} +[2023-09-14 14:43:52,192][63733] Updated weights for policy 1, policy_version 610 (0.0011) +[2023-09-14 14:43:52,250][63735] DAMAGECOUNT value on done: 2070.0 +[2023-09-14 14:43:53,682][63770] DAMAGECOUNT value on done: 1180.0 +[2023-09-14 14:43:53,682][63770] Sum rewards: 0.278, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.040', 'AMMO5': '0.007', 'AMMO2': '0.012', 'WEAPON1': '0.030', 'weapon5': '0.042', 'AMMO4': '0.062', 'HITCOUNT': '0.080', 'AMMO3': '0.090', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.228', 'ARMOR': '0.500', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon2': '1.320', 'weapon3': '1.546'} +[2023-09-14 14:43:54,025][63770] DAMAGECOUNT value on done: 1738.0 +[2023-09-14 14:43:56,844][63805] DAMAGECOUNT value on done: 1469.0 +[2023-09-14 14:43:56,845][63805] Sum rewards: -7.595, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.982', 'ARMOR': '0.004', 'AMMO5': '0.007', 'AMMO2': '0.011', 'AMMO4': '0.053', 'HITCOUNT': '0.070', 'weapon5': '0.072', 'AMMO3': '0.134', 'WEAPON5': '0.150', 'WEAPON4': '0.300', 'weapon4': '0.340', 'DAMAGECOUNT': '0.360', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.238', 'weapon2': '1.348'} +[2023-09-14 14:43:57,202][63805] DAMAGECOUNT value on done: 2153.0 +[2023-09-14 14:43:57,202][63805] Sum rewards: -11.089, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-1.635', 'FRAGCOUNT': '-1.500', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'AMMO2': '0.041', 'weapon5': '0.062', 'HITCOUNT': '0.090', 'AMMO3': '0.091', 'AMMO4': '0.207', 'weapon4': '0.214', 'DAMAGECOUNT': '0.249', 'WEAPON5': '0.250', 'WEAPON4': '0.400', 'weapon3': '0.406', 'WEAPON3': '0.500', 'ARMOR': '0.534', 'weapon2': '2.476'} +[2023-09-14 14:43:57,491][63732] Updated weights for policy 0, policy_version 590 (0.0010) +[2023-09-14 14:43:58,231][63734] DAMAGECOUNT value on done: 1369.0 +[2023-09-14 14:43:58,232][63734] Sum rewards: -3.738, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.238', 'AMMO5': '0.005', 'AMMO2': '0.009', 'AMMO4': '0.045', 'WEAPON5': '0.050', 'AMMO3': '0.068', 'weapon7': '0.086', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.150', 'HITCOUNT': '0.150', 'WEAPON7': '0.200', 'weapon4': '0.294', 'ARMOR': '0.440', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.690', 'FRAGCOUNT': '1.000', 'weapon3': '1.030', 'weapon2': '1.592'} +[2023-09-14 14:43:58,486][63767] DAMAGECOUNT value on done: 1565.0 +[2023-09-14 14:43:58,487][63767] Sum rewards: -3.091, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.724', 'AMMO5': '0.016', 'AMMO2': '0.024', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'AMMO4': '0.118', 'weapon5': '0.124', 'AMMO3': '0.127', 'WEAPON5': '0.250', 'weapon4': '0.342', 'ARMOR': '0.400', 'DAMAGECOUNT': '0.690', 'WEAPON3': '0.700', 'weapon2': '1.076', 'weapon3': '1.326', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:43:58,587][63734] DAMAGECOUNT value on done: 1490.0 +[2023-09-14 14:43:58,870][63767] DAMAGECOUNT value on done: 1590.0 +[2023-09-14 14:43:59,538][63735] DAMAGECOUNT value on done: 1327.0 +[2023-09-14 14:43:59,539][63735] Sum rewards: -4.172, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.969', 'weapon5': '0.006', 'AMMO2': '0.008', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'AMMO4': '0.040', 'weapon7': '0.074', 'AMMO3': '0.075', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.140', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'weapon4': '0.252', 'DAMAGECOUNT': '0.489', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.254', 'weapon2': '1.302'} +[2023-09-14 14:43:59,740][63734] DAMAGECOUNT value on done: 1901.0 +[2023-09-14 14:43:59,741][63734] Sum rewards: -2.379, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.360', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO2': '0.034', 'weapon5': '0.040', 'AMMO3': '0.075', 'HITCOUNT': '0.080', 'weapon7': '0.102', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO4': '0.169', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'weapon4': '0.234', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.441', 'WEAPON3': '0.450', 'ARMOR': '0.458', 'weapon3': '0.934', 'FRAGCOUNT': '1.000', 'weapon2': '1.542'} +[2023-09-14 14:43:59,866][63735] DAMAGECOUNT value on done: 1479.0 +[2023-09-14 14:43:59,867][63735] Sum rewards: -5.456, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.446', 'AMMO2': '0.002', 'AMMO4': '0.011', 'ARMOR': '0.036', 'HITCOUNT': '0.090', 'AMMO3': '0.173', 'DAMAGECOUNT': '0.432', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.158', 'weapon3': '1.238'} +[2023-09-14 14:44:00,134][63734] DAMAGECOUNT value on done: 1977.0 +[2023-09-14 14:44:00,135][63734] Sum rewards: -5.770, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.924', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.004', 'weapon5': '0.012', 'AMMO5': '0.013', 'AMMO4': '0.021', 'WEAPON1': '0.030', 'weapon7': '0.036', 'ARMOR': '0.040', 'WEAPON4': '0.100', 'HITCOUNT': '0.130', 'weapon4': '0.132', 'AMMO3': '0.140', 'WEAPON5': '0.150', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'DAMAGECOUNT': '0.630', 'WEAPON3': '0.700', 'weapon2': '1.006', 'weapon3': '1.160'} +[2023-09-14 14:44:00,265][63733] Updated weights for policy 1, policy_version 620 (0.0011) +[2023-09-14 14:44:00,595][63767] DAMAGECOUNT value on done: 2289.0 +[2023-09-14 14:44:00,596][63767] Sum rewards: -0.098, reward structure: {'DEATHCOUNT': '-5.250', 'AMMO5': '0.007', 'AMMO2': '0.018', 'weapon5': '0.036', 'ARMOR': '0.046', 'HEALTH': '0.060', 'weapon4': '0.064', 'AMMO3': '0.077', 'AMMO4': '0.090', 'HITCOUNT': '0.100', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.450', 'weapon2': '0.754', 'FRAGCOUNT': '1.000', 'weapon3': '1.664'} +[2023-09-14 14:44:00,855][63805] DAMAGECOUNT value on done: 1281.0 +[2023-09-14 14:44:00,856][63805] Sum rewards: -6.044, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.040', 'AMMO5': '0.005', 'weapon5': '0.008', 'AMMO2': '0.011', 'WEAPON5': '0.050', 'AMMO4': '0.052', 'HITCOUNT': '0.100', 'AMMO3': '0.156', 'ARMOR': '0.416', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.012', 'weapon3': '1.586'} +[2023-09-14 14:44:00,941][63767] DAMAGECOUNT value on done: 1757.0 +[2023-09-14 14:44:00,941][63767] Sum rewards: -5.369, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.808', 'AMMO2': '0.010', 'ARMOR': '0.044', 'AMMO4': '0.050', 'WEAPON4': '0.050', 'HITCOUNT': '0.050', 'weapon4': '0.106', 'DAMAGECOUNT': '0.150', 'AMMO3': '0.171', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.080', 'weapon3': '1.128'} +[2023-09-14 14:44:01,238][63805] DAMAGECOUNT value on done: 1634.0 +[2023-09-14 14:44:01,238][63805] Sum rewards: -4.396, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.252', 'AMMO2': '0.002', 'AMMO5': '0.010', 'AMMO4': '0.011', 'ARMOR': '0.024', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.158', 'weapon4': '0.172', 'DAMAGECOUNT': '0.345', 'weapon2': '0.926', 'WEAPON3': '0.950', 'weapon3': '1.298', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:44:03,233][63769] DAMAGECOUNT value on done: 1461.0 +[2023-09-14 14:44:03,234][63769] Sum rewards: -4.093, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.826', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'weapon5': '0.020', 'AMMO2': '0.027', 'HITCOUNT': '0.090', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.114', 'AMMO4': '0.136', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.234', 'weapon2': '1.332'} +[2023-09-14 14:44:03,618][63769] DAMAGECOUNT value on done: 1303.0 +[2023-09-14 14:44:03,619][63769] Sum rewards: -9.288, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-3.000', 'HEALTH': '-0.830', 'AMMO5': '0.014', 'AMMO2': '0.018', 'weapon5': '0.020', 'ARMOR': '0.035', 'HITCOUNT': '0.040', 'weapon7': '0.066', 'AMMO3': '0.074', 'AMMO4': '0.091', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'DAMAGECOUNT': '0.135', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'weapon4': '0.300', 'WEAPON3': '0.450', 'weapon3': '0.880', 'weapon2': '1.518'} +[2023-09-14 14:44:03,733][63732] Updated weights for policy 0, policy_version 600 (0.0011) +[2023-09-14 14:44:05,739][63770] DAMAGECOUNT value on done: 1558.0 +[2023-09-14 14:44:05,740][63770] Sum rewards: -5.820, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.585', 'AMMO5': '0.005', 'AMMO2': '0.038', 'WEAPON5': '0.100', 'AMMO3': '0.103', 'HITCOUNT': '0.140', 'AMMO4': '0.191', 'weapon4': '0.304', 'WEAPON4': '0.400', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.600', 'weapon2': '0.974', 'FRAGCOUNT': '1.000', 'weapon3': '1.460'} +[2023-09-14 14:44:05,752][63771] DAMAGECOUNT value on done: 1225.0 +[2023-09-14 14:44:05,752][63771] Sum rewards: -6.449, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.764', 'AMMO5': '0.005', 'AMMO2': '0.013', 'weapon5': '0.024', 'WEAPON4': '0.050', 'ARMOR': '0.057', 'AMMO4': '0.064', 'weapon4': '0.096', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.181', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.800', 'weapon3': '1.142', 'weapon2': '1.208', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:44:06,067][63770] DAMAGECOUNT value on done: 1456.0 +[2023-09-14 14:44:06,068][63770] Sum rewards: -2.482, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.800', 'AMMO5': '0.010', 'weapon4': '0.016', 'WEAPON1': '0.020', 'AMMO2': '0.021', 'WEAPON4': '0.050', 'AMMO3': '0.056', 'weapon7': '0.088', 'HITCOUNT': '0.100', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO4': '0.106', 'weapon5': '0.178', 'WEAPON5': '0.300', 'WEAPON3': '0.300', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.705', 'weapon3': '0.912', 'weapon2': '1.406'} +[2023-09-14 14:44:06,143][63771] DAMAGECOUNT value on done: 1450.0 +[2023-09-14 14:44:06,144][63771] Sum rewards: -2.672, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.852', 'AMMO5': '0.003', 'AMMO2': '0.012', 'weapon5': '0.018', 'WEAPON5': '0.050', 'AMMO4': '0.062', 'ARMOR': '0.077', 'AMMO3': '0.104', 'HITCOUNT': '0.130', 'weapon4': '0.130', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.600', 'weapon3': '0.830', 'weapon2': '1.434', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:44:06,630][63769] DAMAGECOUNT value on done: 1786.0 +[2023-09-14 14:44:07,017][63769] DAMAGECOUNT value on done: 1175.0 +[2023-09-14 14:44:07,377][63806] DAMAGECOUNT value on done: 1815.0 +[2023-09-14 14:44:07,378][63806] Sum rewards: -6.917, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.152', 'AMMO5': '0.008', 'WEAPON1': '0.020', 'AMMO2': '0.033', 'weapon5': '0.066', 'AMMO3': '0.078', 'HITCOUNT': '0.100', 'AMMO4': '0.165', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.231', 'WEAPON4': '0.400', 'WEAPON3': '0.400', 'weapon4': '0.644', 'weapon3': '0.788', 'ARMOR': '0.892', 'FRAGCOUNT': '1.000', 'weapon2': '1.210'} +[2023-09-14 14:44:07,466][63454] Saving new best policy, reward=-5.285! +[2023-09-14 14:44:07,738][63806] DAMAGECOUNT value on done: 2029.0 +[2023-09-14 14:44:07,782][63806] DAMAGECOUNT value on done: 1285.0 +[2023-09-14 14:44:07,783][63806] Sum rewards: -4.671, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.156', 'AMMO5': '0.010', 'AMMO2': '0.020', 'weapon5': '0.044', 'weapon7': '0.058', 'AMMO4': '0.099', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'HITCOUNT': '0.120', 'AMMO3': '0.140', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.254', 'weapon3': '1.640'} +[2023-09-14 14:44:08,111][63806] DAMAGECOUNT value on done: 1998.0 +[2023-09-14 14:44:08,112][63806] Sum rewards: -1.085, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.250', 'weapon5': '0.002', 'AMMO5': '0.010', 'AMMO2': '0.013', 'weapon7': '0.016', 'AMMO4': '0.065', 'weapon4': '0.072', 'WEAPON4': '0.100', 'AMMO3': '0.132', 'WEAPON5': '0.150', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.280', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.020', 'weapon3': '1.060', 'weapon2': '1.394', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:44:08,354][63733] Updated weights for policy 1, policy_version 630 (0.0011) +[2023-09-14 14:44:08,519][63771] DAMAGECOUNT value on done: 1530.0 +[2023-09-14 14:44:08,520][63771] Sum rewards: -9.316, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.072', 'FRAGCOUNT': '-1.500', 'ARMOR': '0.012', 'AMMO2': '0.024', 'AMMO5': '0.024', 'weapon5': '0.060', 'weapon7': '0.086', 'HITCOUNT': '0.090', 'AMMO4': '0.119', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.132', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.345', 'WEAPON4': '0.350', 'WEAPON5': '0.400', 'weapon4': '0.402', 'WEAPON3': '0.650', 'weapon3': '0.822', 'weapon2': '1.550'} +[2023-09-14 14:44:08,874][63771] DAMAGECOUNT value on done: 2252.0 +[2023-09-14 14:44:08,874][63771] Sum rewards: -3.615, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.350', 'AMMO5': '0.005', 'weapon5': '0.010', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'weapon4': '0.052', 'AMMO4': '0.090', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.124', 'HITCOUNT': '0.160', 'DAMAGECOUNT': '0.558', 'WEAPON3': '0.650', 'weapon2': '0.982', 'FRAGCOUNT': '1.000', 'weapon3': '1.330'} +[2023-09-14 14:44:10,232][63732] Updated weights for policy 0, policy_version 610 (0.0011) +[2023-09-14 14:44:14,103][63735] DAMAGECOUNT value on done: 2182.0 +[2023-09-14 14:44:14,103][63735] Sum rewards: -12.481, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-3.855', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'AMMO5': '0.003', 'ARMOR': '0.048', 'WEAPON5': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.204', 'DAMAGECOUNT': '0.270', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.200', 'weapon3': '1.330', 'weapon2': '1.470'} +[2023-09-14 14:44:14,455][63735] DAMAGECOUNT value on done: 2155.0 +[2023-09-14 14:44:16,564][63733] Updated weights for policy 1, policy_version 640 (0.0012) +[2023-09-14 14:44:16,651][63732] Updated weights for policy 0, policy_version 620 (0.0012) +[2023-09-14 14:44:16,859][63770] DAMAGECOUNT value on done: 1255.0 +[2023-09-14 14:44:16,860][63770] Sum rewards: -7.566, reward structure: {'DEATHCOUNT': '-10.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.353', 'AMMO5': '0.005', 'weapon5': '0.008', 'AMMO2': '0.031', 'AMMO3': '0.071', 'HITCOUNT': '0.080', 'WEAPON5': '0.100', 'AMMO4': '0.153', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.225', 'weapon4': '0.242', 'WEAPON3': '0.450', 'ARMOR': '0.532', 'weapon3': '1.036', 'weapon2': '1.654'} +[2023-09-14 14:44:17,198][63770] DAMAGECOUNT value on done: 2061.0 +[2023-09-14 14:44:17,198][63770] Sum rewards: -7.431, reward structure: {'DEATHCOUNT': '-15.000', 'HEALTH': '-1.288', 'WEAPON1': '0.010', 'weapon5': '0.024', 'AMMO5': '0.025', 'AMMO2': '0.028', 'weapon4': '0.082', 'AMMO4': '0.140', 'AMMO3': '0.200', 'HITCOUNT': '0.230', 'WEAPON5': '0.250', 'WEAPON4': '0.250', 'WEAPON3': '0.950', 'DAMAGECOUNT': '0.969', 'weapon2': '1.182', 'weapon3': '1.516', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:44:20,192][63805] DAMAGECOUNT value on done: 1489.0 +[2023-09-14 14:44:20,569][63805] DAMAGECOUNT value on done: 2233.0 +[2023-09-14 14:44:20,570][63805] Sum rewards: -4.580, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.447', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.023', 'AMMO2': '0.027', 'weapon5': '0.034', 'HITCOUNT': '0.080', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.118', 'AMMO4': '0.137', 'DAMAGECOUNT': '0.240', 'WEAPON4': '0.300', 'WEAPON5': '0.350', 'WEAPON3': '0.700', 'weapon4': '0.710', 'weapon3': '0.872', 'ARMOR': '1.034', 'weapon2': '1.442'} +[2023-09-14 14:44:21,661][63767] DAMAGECOUNT value on done: 1760.0 +[2023-09-14 14:44:21,661][63767] Sum rewards: -4.441, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.158', 'AMMO5': '0.014', 'ARMOR': '0.016', 'AMMO2': '0.028', 'weapon5': '0.056', 'weapon7': '0.074', 'AMMO3': '0.091', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO4': '0.140', 'HITCOUNT': '0.160', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.585', 'WEAPON3': '0.600', 'weapon2': '1.296', 'weapon3': '1.306'} +[2023-09-14 14:44:21,903][63734] DAMAGECOUNT value on done: 1600.0 +[2023-09-14 14:44:21,904][63734] Sum rewards: -0.873, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.550', 'AMMO5': '0.018', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'weapon5': '0.050', 'AMMO4': '0.088', 'AMMO3': '0.092', 'HITCOUNT': '0.140', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.380', 'ARMOR': '0.432', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.693', 'FRAGCOUNT': '1.000', 'weapon2': '1.210', 'weapon3': '1.236'} +[2023-09-14 14:44:22,040][63767] DAMAGECOUNT value on done: 1759.0 +[2023-09-14 14:44:22,041][63767] Sum rewards: 0.308, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.910', 'AMMO5': '0.012', 'AMMO2': '0.022', 'WEAPON1': '0.040', 'weapon5': '0.080', 'WEAPON4': '0.100', 'AMMO4': '0.110', 'AMMO3': '0.120', 'HITCOUNT': '0.210', 'weapon4': '0.214', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.507', 'WEAPON3': '0.550', 'weapon3': '1.148', 'weapon2': '1.354', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:44:22,300][63734] DAMAGECOUNT value on done: 1734.0 +[2023-09-14 14:44:22,461][63454] Saving new best policy, reward=-5.248! +[2023-09-14 14:44:22,966][63732] Updated weights for policy 0, policy_version 630 (0.0011) +[2023-09-14 14:44:23,233][63767] DAMAGECOUNT value on done: 2454.0 +[2023-09-14 14:44:23,234][63767] Sum rewards: -2.624, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.430', 'WEAPON1': '0.020', 'AMMO2': '0.022', 'weapon7': '0.058', 'AMMO4': '0.110', 'ARMOR': '0.112', 'AMMO3': '0.149', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'AMMO6': '0.160', 'AMMO7': '0.160', 'weapon4': '0.166', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.750', 'weapon2': '0.888', 'FRAGCOUNT': '1.000', 'weapon3': '1.466'} +[2023-09-14 14:44:23,605][63805] DAMAGECOUNT value on done: 1330.0 +[2023-09-14 14:44:23,606][63805] Sum rewards: -7.431, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.406', 'AMMO2': '0.005', 'AMMO4': '0.023', 'HITCOUNT': '0.060', 'AMMO3': '0.130', 'DAMAGECOUNT': '0.147', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.184', 'weapon3': '1.676'} +[2023-09-14 14:44:23,622][63767] DAMAGECOUNT value on done: 1882.0 +[2023-09-14 14:44:23,622][63767] Sum rewards: -6.125, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.712', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.007', 'AMMO5': '0.007', 'AMMO4': '0.034', 'WEAPON4': '0.050', 'weapon5': '0.072', 'HITCOUNT': '0.110', 'weapon4': '0.130', 'AMMO3': '0.144', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.900', 'weapon2': '0.976', 'weapon3': '1.332'} +[2023-09-14 14:44:23,975][63805] DAMAGECOUNT value on done: 1674.0 +[2023-09-14 14:44:24,093][63735] DAMAGECOUNT value on done: 1456.0 +[2023-09-14 14:44:24,094][63735] Sum rewards: -5.382, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.460', 'AMMO5': '0.005', 'AMMO2': '0.008', 'WEAPON1': '0.030', 'AMMO4': '0.041', 'weapon5': '0.046', 'WEAPON4': '0.050', 'AMMO3': '0.078', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'weapon4': '0.128', 'DAMAGECOUNT': '0.387', 'ARMOR': '0.456', 'WEAPON3': '0.500', 'weapon2': '1.382', 'weapon3': '1.506'} +[2023-09-14 14:44:24,445][63735] DAMAGECOUNT value on done: 1704.0 +[2023-09-14 14:44:24,446][63735] Sum rewards: -3.898, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.190', 'AMMO4': '-0.023', 'AMMO2': '-0.005', 'AMMO5': '0.005', 'WEAPON5': '0.050', 'HITCOUNT': '0.120', 'AMMO3': '0.157', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.850', 'weapon2': '1.204', 'weapon3': '1.258', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:44:24,957][63733] Updated weights for policy 1, policy_version 650 (0.0010) +[2023-09-14 14:44:25,025][63734] DAMAGECOUNT value on done: 2216.0 +[2023-09-14 14:44:25,025][63734] Sum rewards: -4.018, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.132', 'AMMO5': '0.020', 'AMMO2': '0.021', 'ARMOR': '0.044', 'weapon5': '0.050', 'AMMO4': '0.105', 'AMMO3': '0.125', 'weapon4': '0.174', 'WEAPON5': '0.200', 'HITCOUNT': '0.290', 'WEAPON4': '0.300', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.945', 'weapon2': '1.048', 'weapon3': '1.492', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:44:25,404][63734] DAMAGECOUNT value on done: 1986.0 +[2023-09-14 14:44:27,467][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000652_2670592.pth... +[2023-09-14 14:44:27,468][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000638_2613248.pth... +[2023-09-14 14:44:27,528][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000347_1421312.pth +[2023-09-14 14:44:27,531][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000269_1101824.pth +[2023-09-14 14:44:27,538][63454] Saving new best policy, reward=-5.177! +[2023-09-14 14:44:28,320][63732] Updated weights for policy 0, policy_version 640 (0.0011) +[2023-09-14 14:44:28,473][63769] DAMAGECOUNT value on done: 1481.0 +[2023-09-14 14:44:28,474][63769] Sum rewards: -3.169, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.215', 'AMMO2': '0.007', 'HITCOUNT': '0.030', 'AMMO4': '0.033', 'WEAPON4': '0.050', 'ARMOR': '0.052', 'DAMAGECOUNT': '0.060', 'weapon4': '0.082', 'AMMO3': '0.132', 'WEAPON3': '0.600', 'weapon3': '0.994', 'FRAGCOUNT': '1.000', 'weapon2': '1.506'} +[2023-09-14 14:44:28,644][63771] DAMAGECOUNT value on done: 1359.0 +[2023-09-14 14:44:28,644][63771] Sum rewards: -3.944, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.856', 'AMMO2': '0.011', 'WEAPON1': '0.020', 'ARMOR': '0.020', 'AMMO4': '0.056', 'HITCOUNT': '0.080', 'AMMO3': '0.097', 'DAMAGECOUNT': '0.402', 'WEAPON3': '0.450', 'weapon3': '0.930', 'FRAGCOUNT': '1.000', 'weapon2': '1.596'} +[2023-09-14 14:44:28,883][63769] DAMAGECOUNT value on done: 1433.0 +[2023-09-14 14:44:28,884][63769] Sum rewards: -9.363, reward structure: {'DEATHCOUNT': '-12.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.456', 'AMMO5': '0.012', 'weapon7': '0.016', 'AMMO2': '0.017', 'weapon5': '0.028', 'ARMOR': '0.036', 'AMMO4': '0.083', 'AMMO3': '0.119', 'weapon4': '0.120', 'HITCOUNT': '0.130', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.750', 'weapon3': '1.280', 'weapon2': '1.662'} +[2023-09-14 14:44:28,944][63770] DAMAGECOUNT value on done: 1665.0 +[2023-09-14 14:44:28,945][63770] Sum rewards: -6.784, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.981', 'weapon4': '0.004', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'ARMOR': '0.036', 'weapon5': '0.036', 'AMMO4': '0.084', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.156', 'DAMAGECOUNT': '0.321', 'WEAPON3': '0.900', 'weapon2': '1.024', 'weapon3': '1.794'} +[2023-09-14 14:44:29,066][63771] DAMAGECOUNT value on done: 1642.0 +[2023-09-14 14:44:29,066][63771] Sum rewards: -3.425, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.048', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.018', 'AMMO4': '0.087', 'AMMO3': '0.097', 'WEAPON5': '0.100', 'weapon4': '0.128', 'WEAPON4': '0.150', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.576', 'WEAPON3': '0.600', 'weapon2': '0.914', 'FRAGCOUNT': '1.000', 'weapon3': '1.768'} +[2023-09-14 14:44:29,272][63770] DAMAGECOUNT value on done: 1651.0 +[2023-09-14 14:44:29,273][63770] Sum rewards: -1.758, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.566', 'AMMO5': '0.005', 'AMMO2': '0.016', 'WEAPON5': '0.050', 'AMMO4': '0.078', 'AMMO3': '0.114', 'HITCOUNT': '0.160', 'WEAPON4': '0.200', 'weapon4': '0.262', 'ARMOR': '0.464', 'DAMAGECOUNT': '0.585', 'WEAPON3': '0.700', 'weapon3': '1.542', 'weapon2': '1.632', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:44:29,539][63769] DAMAGECOUNT value on done: 2065.0 +[2023-09-14 14:44:29,540][63769] Sum rewards: -4.389, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.671', 'AMMO5': '0.012', 'weapon5': '0.014', 'AMMO2': '0.017', 'ARMOR': '0.063', 'AMMO4': '0.084', 'AMMO3': '0.087', 'weapon4': '0.174', 'WEAPON4': '0.200', 'HITCOUNT': '0.250', 'WEAPON5': '0.250', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.600', 'weapon2': '0.768', 'DAMAGECOUNT': '0.837', 'weapon3': '1.676'} +[2023-09-14 14:44:29,953][63769] DAMAGECOUNT value on done: 1275.0 +[2023-09-14 14:44:29,953][63769] Sum rewards: 0.093, reward structure: {'DEATHCOUNT': '-3.750', 'HEALTH': '-1.060', 'AMMO4': '-0.021', 'AMMO2': '-0.004', 'AMMO5': '0.005', 'HITCOUNT': '0.050', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.106', 'DAMAGECOUNT': '0.300', 'weapon4': '0.346', 'WEAPON3': '0.450', 'ARMOR': '0.481', 'weapon2': '0.852', 'FRAGCOUNT': '1.000', 'weapon3': '1.138'} +[2023-09-14 14:44:30,380][63806] DAMAGECOUNT value on done: 1955.0 +[2023-09-14 14:44:30,381][63806] Sum rewards: -6.479, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.148', 'AMMO5': '0.007', 'AMMO2': '0.018', 'weapon5': '0.022', 'WEAPON1': '0.040', 'ARMOR': '0.064', 'HITCOUNT': '0.080', 'AMMO4': '0.091', 'WEAPON5': '0.150', 'AMMO3': '0.156', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.420', 'weapon4': '0.438', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon3': '1.172', 'weapon2': '1.360'} +[2023-09-14 14:44:30,841][63806] DAMAGECOUNT value on done: 2153.0 +[2023-09-14 14:44:30,842][63806] Sum rewards: -6.552, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.684', 'AMMO5': '0.009', 'AMMO2': '0.020', 'weapon5': '0.036', 'HITCOUNT': '0.080', 'AMMO4': '0.099', 'WEAPON5': '0.100', 'AMMO3': '0.101', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.372', 'weapon4': '0.376', 'ARMOR': '0.400', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.244', 'weapon2': '1.694'} +[2023-09-14 14:44:30,930][63806] DAMAGECOUNT value on done: 1300.0 +[2023-09-14 14:44:31,371][63806] DAMAGECOUNT value on done: 2073.0 +[2023-09-14 14:44:31,371][63806] Sum rewards: -3.228, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-0.500', 'HEALTH': '-0.110', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'AMMO2': '0.019', 'ARMOR': '0.020', 'WEAPON4': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.092', 'AMMO4': '0.096', 'weapon4': '0.100', 'weapon5': '0.136', 'DAMAGECOUNT': '0.225', 'WEAPON5': '0.300', 'WEAPON3': '0.450', 'weapon2': '0.968', 'weapon3': '1.590'} +[2023-09-14 14:44:34,616][63771] DAMAGECOUNT value on done: 1650.0 +[2023-09-14 14:44:34,974][63732] Updated weights for policy 0, policy_version 650 (0.0015) +[2023-09-14 14:44:35,113][63771] DAMAGECOUNT value on done: 2567.0 +[2023-09-14 14:44:35,114][63771] Sum rewards: -4.448, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.785', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'AMMO5': '0.005', 'weapon5': '0.006', 'ARMOR': '0.044', 'WEAPON5': '0.050', 'AMMO3': '0.134', 'HITCOUNT': '0.250', 'FRAGCOUNT': '0.500', 'weapon2': '0.646', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.945', 'weapon3': '2.120'} +[2023-09-14 14:44:36,631][63733] Updated weights for policy 1, policy_version 660 (0.0011) +[2023-09-14 14:44:36,968][63735] DAMAGECOUNT value on done: 2307.0 +[2023-09-14 14:44:36,969][63735] Sum rewards: -3.668, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.650', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.003', 'WEAPON1': '0.020', 'weapon4': '0.038', 'WEAPON4': '0.050', 'ARMOR': '0.068', 'HITCOUNT': '0.070', 'AMMO3': '0.088', 'WEAPON5': '0.100', 'weapon5': '0.104', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.450', 'FRAGCOUNT': '0.500', 'weapon3': '1.014', 'weapon2': '1.108'} +[2023-09-14 14:44:37,400][63735] DAMAGECOUNT value on done: 2315.0 +[2023-09-14 14:44:37,401][63735] Sum rewards: -4.021, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.560', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.017', 'AMMO2': '-0.003', 'weapon5': '0.006', 'AMMO5': '0.009', 'ARMOR': '0.040', 'AMMO3': '0.093', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.116', 'HITCOUNT': '0.120', 'DAMAGECOUNT': '0.480', 'WEAPON3': '0.600', 'weapon3': '1.024', 'weapon2': '1.370'} +[2023-09-14 14:44:37,466][63454] Saving new best policy, reward=-5.174! +[2023-09-14 14:44:37,466][63576] Saving new best policy, reward=-5.309! +[2023-09-14 14:44:41,368][63732] Updated weights for policy 0, policy_version 660 (0.0012) +[2023-09-14 14:44:41,993][63770] DAMAGECOUNT value on done: 1280.0 +[2023-09-14 14:44:42,325][63770] DAMAGECOUNT value on done: 2111.0 +[2023-09-14 14:44:45,292][63805] DAMAGECOUNT value on done: 1580.0 +[2023-09-14 14:44:45,292][63805] Sum rewards: -2.870, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.882', 'weapon5': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.017', 'WEAPON1': '0.020', 'AMMO4': '0.083', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.141', 'WEAPON5': '0.150', 'weapon7': '0.154', 'AMMO6': '0.220', 'AMMO7': '0.220', 'DAMAGECOUNT': '0.273', 'WEAPON7': '0.300', 'ARMOR': '0.460', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.338', 'weapon2': '1.658'} +[2023-09-14 14:44:45,688][63805] DAMAGECOUNT value on done: 2362.0 +[2023-09-14 14:44:45,689][63805] Sum rewards: -3.926, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.342', 'AMMO2': '0.000', 'AMMO4': '0.002', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'weapon5': '0.034', 'WEAPON5': '0.100', 'HITCOUNT': '0.130', 'AMMO3': '0.170', 'WEAPON4': '0.200', 'weapon4': '0.262', 'DAMAGECOUNT': '0.387', 'ARMOR': '0.518', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.254', 'weapon3': '1.684'} +[2023-09-14 14:44:46,142][63733] Updated weights for policy 1, policy_version 670 (0.0011) +[2023-09-14 14:44:46,605][63767] DAMAGECOUNT value on done: 2029.0 +[2023-09-14 14:44:46,605][63767] Sum rewards: -0.014, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.596', 'AMMO2': '0.007', 'AMMO5': '0.013', 'weapon5': '0.016', 'AMMO4': '0.032', 'WEAPON4': '0.050', 'weapon4': '0.066', 'AMMO3': '0.115', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon7': '0.128', 'WEAPON5': '0.150', 'WEAPON7': '0.200', 'HITCOUNT': '0.220', 'ARMOR': '0.428', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.807', 'weapon2': '1.396', 'weapon3': '1.514', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:44:46,999][63767] DAMAGECOUNT value on done: 1823.0 +[2023-09-14 14:44:47,309][63734] DAMAGECOUNT value on done: 1751.0 +[2023-09-14 14:44:47,310][63734] Sum rewards: 0.103, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.385', 'weapon4': '0.004', 'AMMO5': '0.010', 'AMMO2': '0.016', 'weapon5': '0.016', 'WEAPON1': '0.030', 'weapon7': '0.034', 'WEAPON4': '0.050', 'AMMO4': '0.077', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.116', 'HITCOUNT': '0.150', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.453', 'WEAPON3': '0.500', 'ARMOR': '0.536', 'weapon2': '1.048', 'weapon3': '1.698', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:44:47,439][63732] Updated weights for policy 0, policy_version 670 (0.0011) +[2023-09-14 14:44:47,468][63454] Saving new best policy, reward=-5.059! +[2023-09-14 14:44:47,718][63734] DAMAGECOUNT value on done: 2036.0 +[2023-09-14 14:44:47,719][63734] Sum rewards: 0.831, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.182', 'AMMO5': '0.012', 'AMMO2': '0.013', 'WEAPON1': '0.020', 'weapon5': '0.020', 'ARMOR': '0.052', 'AMMO4': '0.064', 'AMMO3': '0.148', 'WEAPON5': '0.150', 'HITCOUNT': '0.190', 'WEAPON4': '0.200', 'weapon4': '0.218', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.906', 'weapon2': '1.550', 'weapon3': '1.620', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:44:48,278][63767] DAMAGECOUNT value on done: 2559.0 +[2023-09-14 14:44:48,279][63767] Sum rewards: -2.179, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.202', 'ARMOR': '0.004', 'AMMO2': '0.005', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO4': '0.023', 'weapon7': '0.046', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.146', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'weapon4': '0.280', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.750', 'weapon2': '0.906', 'weapon3': '1.428', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:44:48,595][63767] DAMAGECOUNT value on done: 2074.0 +[2023-09-14 14:44:48,595][63767] Sum rewards: -5.780, reward structure: {'DEATHCOUNT': '-10.500', 'FRAGCOUNT': '-0.500', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO2': '0.029', 'AMMO3': '0.079', 'weapon5': '0.084', 'HEALTH': '0.096', 'weapon4': '0.112', 'HITCOUNT': '0.120', 'AMMO4': '0.142', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.576', 'weapon3': '1.112', 'weapon2': '2.048'} +[2023-09-14 14:44:48,776][63805] DAMAGECOUNT value on done: 1460.0 +[2023-09-14 14:44:48,776][63805] Sum rewards: -3.547, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.714', 'AMMO2': '0.013', 'AMMO5': '0.023', 'weapon5': '0.034', 'AMMO4': '0.063', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.150', 'WEAPON5': '0.250', 'weapon4': '0.256', 'DAMAGECOUNT': '0.390', 'ARMOR': '0.420', 'WEAPON3': '0.950', 'weapon2': '1.006', 'weapon3': '1.912', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:44:49,180][63805] DAMAGECOUNT value on done: 1843.0 +[2023-09-14 14:44:49,181][63805] Sum rewards: -5.136, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.290', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.012', 'WEAPON4': '0.050', 'HITCOUNT': '0.050', 'weapon4': '0.054', 'weapon5': '0.074', 'AMMO3': '0.158', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.507', 'WEAPON3': '0.850', 'weapon3': '1.384', 'weapon2': '1.470'} +[2023-09-14 14:44:50,636][63735] DAMAGECOUNT value on done: 1506.0 +[2023-09-14 14:44:50,637][63735] Sum rewards: -3.105, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.718', 'AMMO2': '0.012', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'weapon5': '0.028', 'ARMOR': '0.032', 'HITCOUNT': '0.050', 'weapon4': '0.052', 'AMMO4': '0.062', 'AMMO3': '0.129', 'DAMAGECOUNT': '0.150', 'WEAPON4': '0.150', 'WEAPON5': '0.250', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.542', 'weapon3': '1.668'} +[2023-09-14 14:44:51,016][63735] DAMAGECOUNT value on done: 1714.0 +[2023-09-14 14:44:51,661][63734] DAMAGECOUNT value on done: 2357.0 +[2023-09-14 14:44:52,063][63734] DAMAGECOUNT value on done: 2081.0 +[2023-09-14 14:44:52,461][63454] Saving new best policy, reward=-4.940! +[2023-09-14 14:44:53,151][63806] DAMAGECOUNT value on done: 2000.0 +[2023-09-14 14:44:53,480][63806] DAMAGECOUNT value on done: 1432.0 +[2023-09-14 14:44:53,744][63733] Updated weights for policy 1, policy_version 680 (0.0011) +[2023-09-14 14:44:54,784][63732] Updated weights for policy 0, policy_version 680 (0.0011) +[2023-09-14 14:44:55,089][63769] DAMAGECOUNT value on done: 1676.0 +[2023-09-14 14:44:55,090][63769] Sum rewards: -4.103, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.127', 'AMMO4': '-0.000', 'AMMO2': '0.000', 'AMMO5': '0.009', 'weapon4': '0.012', 'WEAPON1': '0.020', 'weapon5': '0.024', 'ARMOR': '0.032', 'WEAPON4': '0.100', 'AMMO3': '0.116', 'HITCOUNT': '0.180', 'WEAPON5': '0.200', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.585', 'weapon2': '1.476', 'weapon3': '1.520'} +[2023-09-14 14:44:55,315][63771] DAMAGECOUNT value on done: 1534.0 +[2023-09-14 14:44:55,316][63771] Sum rewards: 0.267, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.850', 'AMMO5': '0.003', 'weapon5': '0.010', 'AMMO2': '0.012', 'WEAPON1': '0.030', 'WEAPON5': '0.050', 'AMMO4': '0.059', 'weapon4': '0.090', 'WEAPON4': '0.100', 'weapon7': '0.110', 'HITCOUNT': '0.120', 'AMMO3': '0.148', 'AMMO6': '0.320', 'AMMO7': '0.320', 'WEAPON7': '0.400', 'DAMAGECOUNT': '0.525', 'WEAPON3': '0.700', 'weapon3': '1.236', 'weapon2': '1.634', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:44:55,526][63769] DAMAGECOUNT value on done: 1843.0 +[2023-09-14 14:44:55,526][63769] Sum rewards: -2.946, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.726', 'AMMO5': '0.010', 'AMMO2': '0.015', 'weapon5': '0.030', 'AMMO4': '0.076', 'weapon7': '0.084', 'WEAPON5': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.126', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'weapon4': '0.204', 'HITCOUNT': '0.260', 'ARMOR': '0.424', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.230', 'weapon2': '1.430', 'FRAGCOUNT': '1.500', 'weapon3': '1.600'} +[2023-09-14 14:44:55,596][63770] DAMAGECOUNT value on done: 2163.0 +[2023-09-14 14:44:55,597][63770] Sum rewards: -4.137, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.980', 'AMMO2': '0.003', 'AMMO4': '0.015', 'AMMO5': '0.017', 'ARMOR': '0.028', 'AMMO3': '0.103', 'HITCOUNT': '0.180', 'weapon5': '0.196', 'WEAPON5': '0.450', 'WEAPON3': '0.550', 'weapon2': '1.482', 'DAMAGECOUNT': '1.494', 'weapon3': '1.574', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:44:55,714][63771] DAMAGECOUNT value on done: 1838.0 +[2023-09-14 14:44:55,715][63771] Sum rewards: -1.272, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.740', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.005', 'weapon5': '0.008', 'WEAPON5': '0.050', 'AMMO3': '0.091', 'HITCOUNT': '0.140', 'WEAPON3': '0.300', 'ARMOR': '0.454', 'DAMAGECOUNT': '0.588', 'weapon2': '1.288', 'weapon3': '1.290', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:44:56,005][63770] DAMAGECOUNT value on done: 1801.0 +[2023-09-14 14:44:56,006][63770] Sum rewards: -4.617, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.640', 'AMMO2': '0.020', 'weapon4': '0.030', 'ARMOR': '0.032', 'AMMO4': '0.097', 'WEAPON4': '0.100', 'HITCOUNT': '0.120', 'AMMO3': '0.150', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.900', 'weapon2': '1.134', 'weapon3': '1.740', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:44:56,172][63769] DAMAGECOUNT value on done: 2228.0 +[2023-09-14 14:44:56,173][63769] Sum rewards: -4.578, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.350', 'AMMO2': '0.006', 'AMMO5': '0.014', 'AMMO4': '0.032', 'WEAPON4': '0.050', 'weapon4': '0.056', 'weapon5': '0.072', 'AMMO3': '0.117', 'HITCOUNT': '0.190', 'WEAPON5': '0.300', 'ARMOR': '0.484', 'DAMAGECOUNT': '0.489', 'WEAPON3': '0.650', 'weapon2': '1.620', 'weapon3': '1.692'} +[2023-09-14 14:44:56,558][63769] DAMAGECOUNT value on done: 1325.0 +[2023-09-14 14:44:57,087][63806] DAMAGECOUNT value on done: 2298.0 +[2023-09-14 14:44:57,087][63806] Sum rewards: -4.104, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.111', 'AMMO5': '0.003', 'AMMO2': '0.004', 'AMMO4': '0.018', 'HITCOUNT': '0.080', 'AMMO3': '0.140', 'WEAPON4': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon4': '0.376', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.850', 'weapon2': '0.932', 'FRAGCOUNT': '1.000', 'weapon3': '1.620'} +[2023-09-14 14:44:57,466][63454] Saving new best policy, reward=-4.708! +[2023-09-14 14:44:57,485][63806] DAMAGECOUNT value on done: 2479.0 +[2023-09-14 14:44:57,486][63806] Sum rewards: -4.801, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.169', 'AMMO2': '0.011', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.054', 'AMMO3': '0.113', 'weapon5': '0.124', 'weapon4': '0.188', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'HITCOUNT': '0.250', 'WEAPON3': '0.700', 'ARMOR': '0.937', 'DAMAGECOUNT': '1.218', 'weapon3': '1.484', 'weapon2': '1.556', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:44:59,272][63735] DAMAGECOUNT value on done: 2452.0 +[2023-09-14 14:44:59,631][63735] DAMAGECOUNT value on done: 2415.0 +[2023-09-14 14:44:59,631][63735] Sum rewards: -5.277, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.086', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'AMMO2': '0.016', 'weapon5': '0.018', 'WEAPON5': '0.050', 'HITCOUNT': '0.080', 'AMMO4': '0.081', 'AMMO3': '0.129', 'WEAPON4': '0.200', 'weapon4': '0.236', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.750', 'weapon2': '1.158', 'weapon3': '1.536'} +[2023-09-14 14:45:00,280][63771] DAMAGECOUNT value on done: 1815.0 +[2023-09-14 14:45:00,281][63771] Sum rewards: 0.728, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.776', 'AMMO2': '0.008', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'ARMOR': '0.020', 'AMMO4': '0.041', 'WEAPON4': '0.050', 'weapon5': '0.066', 'AMMO3': '0.140', 'HITCOUNT': '0.170', 'weapon4': '0.180', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.700', 'weapon2': '1.134', 'weapon3': '1.964', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:45:00,624][63771] DAMAGECOUNT value on done: 2963.0 +[2023-09-14 14:45:00,624][63771] Sum rewards: -4.282, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-1.030', 'AMMO5': '0.010', 'weapon5': '0.010', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'AMMO2': '0.034', 'AMMO3': '0.144', 'AMMO4': '0.172', 'WEAPON5': '0.200', 'weapon4': '0.200', 'HITCOUNT': '0.320', 'WEAPON4': '0.400', 'WEAPON3': '0.800', 'weapon2': '1.168', 'DAMAGECOUNT': '1.188', 'weapon3': '1.550', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:45:01,021][63733] Updated weights for policy 1, policy_version 690 (0.0010) +[2023-09-14 14:45:02,147][63732] Updated weights for policy 0, policy_version 690 (0.0010) +[2023-09-14 14:45:02,462][63454] Saving new best policy, reward=-4.648! +[2023-09-14 14:45:07,263][63770] DAMAGECOUNT value on done: 1435.0 +[2023-09-14 14:45:07,663][63770] DAMAGECOUNT value on done: 2126.0 +[2023-09-14 14:45:07,737][63733] Updated weights for policy 1, policy_version 700 (0.0011) +[2023-09-14 14:45:09,175][63767] DAMAGECOUNT value on done: 2409.0 +[2023-09-14 14:45:09,175][63767] Sum rewards: -5.735, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-1.344', 'weapon5': '0.014', 'AMMO5': '0.015', 'AMMO2': '0.015', 'AMMO4': '0.075', 'AMMO3': '0.202', 'WEAPON4': '0.250', 'weapon4': '0.282', 'HITCOUNT': '0.290', 'WEAPON5': '0.300', 'ARMOR': '0.451', 'weapon2': '0.952', 'WEAPON3': '1.050', 'DAMAGECOUNT': '1.140', 'FRAGCOUNT': '2.000', 'weapon3': '2.072'} +[2023-09-14 14:45:09,494][63767] DAMAGECOUNT value on done: 2171.0 +[2023-09-14 14:45:09,495][63767] Sum rewards: -3.132, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.024', 'AMMO4': '-0.013', 'AMMO2': '-0.003', 'WEAPON1': '0.020', 'weapon4': '0.020', 'AMMO5': '0.022', 'ARMOR': '0.024', 'WEAPON4': '0.050', 'weapon5': '0.078', 'AMMO3': '0.166', 'HITCOUNT': '0.290', 'WEAPON5': '0.350', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.044', 'weapon3': '1.386', 'weapon2': '1.808', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:45:09,883][63732] Updated weights for policy 0, policy_version 700 (0.0010) +[2023-09-14 14:45:09,975][63805] DAMAGECOUNT value on done: 1665.0 +[2023-09-14 14:45:09,976][63805] Sum rewards: -0.994, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.370', 'AMMO2': '0.006', 'AMMO5': '0.015', 'AMMO4': '0.027', 'WEAPON4': '0.050', 'weapon5': '0.050', 'HITCOUNT': '0.080', 'weapon4': '0.152', 'AMMO3': '0.165', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.255', 'ARMOR': '0.464', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.700', 'weapon2': '1.468', 'weapon3': '1.944'} +[2023-09-14 14:45:10,296][63734] DAMAGECOUNT value on done: 1776.0 +[2023-09-14 14:45:10,309][63805] DAMAGECOUNT value on done: 2527.0 +[2023-09-14 14:45:10,309][63805] Sum rewards: -6.925, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.130', 'AMMO4': '-0.031', 'AMMO2': '-0.006', 'weapon7': '0.072', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.120', 'AMMO3': '0.155', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.048', 'weapon3': '1.562'} +[2023-09-14 14:45:10,682][63734] DAMAGECOUNT value on done: 2091.0 +[2023-09-14 14:45:10,683][63734] Sum rewards: -9.103, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.888', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'weapon5': '0.012', 'AMMO2': '0.018', 'weapon7': '0.054', 'HITCOUNT': '0.060', 'weapon4': '0.062', 'AMMO4': '0.090', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON5': '0.100', 'ARMOR': '0.111', 'DAMAGECOUNT': '0.165', 'WEAPON4': '0.200', 'AMMO3': '0.228', 'weapon2': '1.178', 'WEAPON3': '1.200', 'weapon3': '1.502'} +[2023-09-14 14:45:10,719][63767] DAMAGECOUNT value on done: 2750.0 +[2023-09-14 14:45:10,719][63767] Sum rewards: -1.961, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.780', 'AMMO2': '0.010', 'AMMO5': '0.032', 'AMMO4': '0.051', 'weapon4': '0.078', 'AMMO3': '0.083', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON4': '0.100', 'weapon5': '0.132', 'HITCOUNT': '0.150', 'weapon7': '0.154', 'WEAPON5': '0.550', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.573', 'FRAGCOUNT': '1.000', 'weapon2': '1.084', 'weapon3': '1.472'} +[2023-09-14 14:45:11,046][63767] DAMAGECOUNT value on done: 2349.0 +[2023-09-14 14:45:11,047][63767] Sum rewards: -1.439, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.478', 'AMMO4': '-0.018', 'AMMO2': '-0.004', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'weapon4': '0.024', 'weapon5': '0.032', 'WEAPON4': '0.050', 'AMMO3': '0.130', 'weapon7': '0.176', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.230', 'WEAPON5': '0.250', 'ARMOR': '0.525', 'DAMAGECOUNT': '0.825', 'WEAPON3': '0.850', 'weapon3': '1.518', 'weapon2': '1.566', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:45:11,562][63805] DAMAGECOUNT value on done: 1686.0 +[2023-09-14 14:45:11,562][63805] Sum rewards: -0.990, reward structure: {'DEATHCOUNT': '-10.500', 'AMMO5': '0.015', 'weapon5': '0.024', 'AMMO2': '0.030', 'weapon7': '0.074', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'HEALTH': '0.122', 'weapon4': '0.124', 'AMMO3': '0.136', 'WEAPON4': '0.150', 'AMMO4': '0.150', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'ARMOR': '0.416', 'DAMAGECOUNT': '0.678', 'WEAPON3': '0.750', 'weapon2': '1.190', 'weapon3': '1.880', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:45:11,897][63805] DAMAGECOUNT value on done: 2286.0 +[2023-09-14 14:45:11,897][63805] Sum rewards: 3.566, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.773', 'AMMO4': '-0.003', 'AMMO2': '-0.000', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'WEAPON5': '0.050', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.140', 'weapon7': '0.220', 'HITCOUNT': '0.300', 'ARMOR': '0.400', 'WEAPON3': '0.600', 'weapon3': '1.310', 'DAMAGECOUNT': '1.329', 'weapon2': '1.680', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:45:12,461][63454] Saving new best policy, reward=-4.503! +[2023-09-14 14:45:14,752][63733] Updated weights for policy 1, policy_version 710 (0.0011) +[2023-09-14 14:45:15,080][63735] DAMAGECOUNT value on done: 1691.0 +[2023-09-14 14:45:15,080][63735] Sum rewards: -5.723, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.829', 'weapon5': '0.014', 'AMMO2': '0.023', 'AMMO5': '0.028', 'ARMOR': '0.036', 'WEAPON4': '0.050', 'weapon4': '0.054', 'AMMO4': '0.114', 'HITCOUNT': '0.150', 'AMMO3': '0.223', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.555', 'WEAPON3': '1.150', 'weapon2': '1.310', 'FRAGCOUNT': '2.000', 'weapon3': '2.050'} +[2023-09-14 14:45:15,513][63735] DAMAGECOUNT value on done: 1814.0 +[2023-09-14 14:45:15,652][63806] DAMAGECOUNT value on done: 2154.0 +[2023-09-14 14:45:16,027][63806] DAMAGECOUNT value on done: 1533.0 +[2023-09-14 14:45:16,027][63806] Sum rewards: -3.309, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.096', 'AMMO2': '0.008', 'AMMO5': '0.010', 'AMMO4': '0.037', 'HITCOUNT': '0.070', 'ARMOR': '0.072', 'WEAPON5': '0.100', 'AMMO3': '0.111', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.303', 'weapon4': '0.620', 'WEAPON3': '0.700', 'weapon2': '0.942', 'FRAGCOUNT': '1.000', 'weapon3': '1.264'} +[2023-09-14 14:45:16,652][63734] DAMAGECOUNT value on done: 2682.0 +[2023-09-14 14:45:16,653][63734] Sum rewards: 0.937, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.003', 'AMMO2': '0.009', 'weapon5': '0.010', 'WEAPON1': '0.010', 'AMMO4': '0.044', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'weapon4': '0.088', 'AMMO3': '0.115', 'HITCOUNT': '0.280', 'WEAPON3': '0.550', 'HEALTH': '0.598', 'DAMAGECOUNT': '0.975', 'FRAGCOUNT': '1.000', 'weapon2': '1.212', 'weapon3': '1.944'} +[2023-09-14 14:45:17,122][63734] DAMAGECOUNT value on done: 2081.0 +[2023-09-14 14:45:17,466][63454] Saving new best policy, reward=-4.461! +[2023-09-14 14:45:17,762][63732] Updated weights for policy 0, policy_version 710 (0.0011) +[2023-09-14 14:45:20,391][63769] DAMAGECOUNT value on done: 1891.0 +[2023-09-14 14:45:20,644][63771] DAMAGECOUNT value on done: 1802.0 +[2023-09-14 14:45:20,645][63771] Sum rewards: -2.647, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.407', 'AMMO5': '0.003', 'AMMO2': '0.034', 'WEAPON5': '0.050', 'weapon7': '0.058', 'AMMO3': '0.171', 'AMMO4': '0.172', 'weapon4': '0.182', 'HITCOUNT': '0.280', 'AMMO6': '0.300', 'WEAPON7': '0.300', 'AMMO7': '0.300', 'WEAPON4': '0.350', 'DAMAGECOUNT': '0.804', 'WEAPON3': '0.950', 'weapon2': '1.192', 'weapon3': '1.864', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:45:20,785][63769] DAMAGECOUNT value on done: 1983.0 +[2023-09-14 14:45:20,785][63769] Sum rewards: -3.061, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.516', 'weapon4': '0.010', 'AMMO2': '0.015', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'ARMOR': '0.060', 'AMMO4': '0.074', 'weapon5': '0.076', 'WEAPON4': '0.100', 'HITCOUNT': '0.130', 'AMMO3': '0.151', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.750', 'weapon2': '1.646', 'weapon3': '1.738', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:45:20,988][63770] DAMAGECOUNT value on done: 2307.0 +[2023-09-14 14:45:21,044][63771] DAMAGECOUNT value on done: 1928.0 +[2023-09-14 14:45:21,044][63771] Sum rewards: -3.855, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.455', 'AMMO5': '0.003', 'AMMO2': '0.009', 'WEAPON1': '0.010', 'weapon5': '0.022', 'ARMOR': '0.024', 'AMMO4': '0.043', 'WEAPON5': '0.050', 'HITCOUNT': '0.080', 'AMMO3': '0.122', 'DAMAGECOUNT': '0.270', 'WEAPON3': '0.700', 'weapon2': '0.876', 'FRAGCOUNT': '1.000', 'weapon3': '1.642'} +[2023-09-14 14:45:21,389][63770] DAMAGECOUNT value on done: 1901.0 +[2023-09-14 14:45:21,390][63770] Sum rewards: -6.911, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.030', 'AMMO4': '-0.039', 'AMMO2': '-0.008', 'ARMOR': '0.037', 'HITCOUNT': '0.090', 'AMMO3': '0.176', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.194', 'weapon3': '1.918'} +[2023-09-14 14:45:21,442][63769] DAMAGECOUNT value on done: 2346.0 +[2023-09-14 14:45:21,805][63733] Updated weights for policy 1, policy_version 720 (0.0011) +[2023-09-14 14:45:21,807][63806] DAMAGECOUNT value on done: 2563.0 +[2023-09-14 14:45:21,807][63806] Sum rewards: 0.754, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.418', 'AMMO2': '0.011', 'AMMO4': '0.056', 'ARMOR': '0.076', 'AMMO3': '0.095', 'WEAPON4': '0.100', 'HITCOUNT': '0.170', 'weapon4': '0.206', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.795', 'FRAGCOUNT': '1.000', 'weapon2': '1.158', 'weapon3': '1.504'} +[2023-09-14 14:45:21,887][63769] DAMAGECOUNT value on done: 1550.0 +[2023-09-14 14:45:21,887][63769] Sum rewards: -0.364, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.599', 'weapon5': '0.006', 'AMMO5': '0.007', 'AMMO2': '0.020', 'ARMOR': '0.044', 'WEAPON5': '0.050', 'weapon4': '0.052', 'AMMO3': '0.091', 'AMMO4': '0.097', 'WEAPON4': '0.200', 'HITCOUNT': '0.210', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.675', 'weapon2': '0.908', 'weapon3': '1.824', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:45:22,040][63735] DAMAGECOUNT value on done: 2767.0 +[2023-09-14 14:45:22,041][63735] Sum rewards: -1.148, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.488', 'weapon5': '0.002', 'AMMO2': '0.004', 'AMMO5': '0.010', 'weapon4': '0.018', 'AMMO4': '0.019', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'WEAPON4': '0.050', 'AMMO3': '0.076', 'WEAPON5': '0.150', 'HITCOUNT': '0.250', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.945', 'weapon3': '1.380', 'weapon2': '1.480', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:45:22,151][63806] DAMAGECOUNT value on done: 2534.0 +[2023-09-14 14:45:22,152][63806] Sum rewards: -9.042, reward structure: {'DEATHCOUNT': '-11.250', 'FRAGCOUNT': '-2.000', 'HEALTH': '-1.797', 'WEAPON1': '0.010', 'AMMO2': '0.012', 'AMMO5': '0.023', 'weapon4': '0.040', 'WEAPON4': '0.050', 'AMMO4': '0.058', 'HITCOUNT': '0.060', 'weapon5': '0.154', 'DAMAGECOUNT': '0.165', 'AMMO3': '0.198', 'ARMOR': '0.476', 'WEAPON5': '0.500', 'WEAPON3': '1.150', 'weapon2': '1.228', 'weapon3': '1.880'} +[2023-09-14 14:45:22,442][63735] DAMAGECOUNT value on done: 2615.0 +[2023-09-14 14:45:22,443][63735] Sum rewards: 0.365, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.003', 'AMMO2': '0.011', 'AMMO4': '0.055', 'AMMO3': '0.088', 'ARMOR': '0.090', 'HEALTH': '0.090', 'WEAPON4': '0.150', 'HITCOUNT': '0.190', 'weapon4': '0.230', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.600', 'weapon2': '1.140', 'weapon3': '1.268', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:45:22,461][63576] Saving new best policy, reward=-5.212! +[2023-09-14 14:45:22,461][63454] Saving new best policy, reward=-4.443! +[2023-09-14 14:45:23,841][63771] DAMAGECOUNT value on done: 2030.0 +[2023-09-14 14:45:24,182][63771] DAMAGECOUNT value on done: 3063.0 +[2023-09-14 14:45:24,182][63771] Sum rewards: -7.987, reward structure: {'DEATHCOUNT': '-12.000', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'AMMO2': '0.012', 'weapon5': '0.014', 'WEAPON4': '0.050', 'AMMO4': '0.060', 'ARMOR': '0.064', 'HITCOUNT': '0.070', 'WEAPON5': '0.100', 'weapon4': '0.104', 'HEALTH': '0.108', 'AMMO3': '0.158', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.750', 'weapon2': '1.282', 'weapon3': '1.436'} +[2023-09-14 14:45:25,532][63732] Updated weights for policy 0, policy_version 720 (0.0010) +[2023-09-14 14:45:28,644][63733] Updated weights for policy 1, policy_version 730 (0.0010) +[2023-09-14 14:45:31,417][63767] DAMAGECOUNT value on done: 2538.0 +[2023-09-14 14:45:31,418][63767] Sum rewards: -6.250, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.802', 'AMMO5': '0.005', 'AMMO2': '0.017', 'AMMO4': '0.084', 'ARMOR': '0.089', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.116', 'WEAPON4': '0.200', 'weapon4': '0.260', 'DAMAGECOUNT': '0.387', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.062', 'weapon2': '1.432'} +[2023-09-14 14:45:31,794][63767] DAMAGECOUNT value on done: 2205.0 +[2023-09-14 14:45:31,795][63767] Sum rewards: -5.294, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.220', 'FRAGCOUNT': '-1.500', 'AMMO4': '-0.022', 'AMMO2': '-0.004', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'HITCOUNT': '0.040', 'WEAPON4': '0.050', 'weapon5': '0.068', 'DAMAGECOUNT': '0.102', 'weapon7': '0.122', 'AMMO3': '0.142', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.300', 'WEAPON3': '0.850', 'weapon2': '1.156', 'weapon3': '1.734'} +[2023-09-14 14:45:32,605][63770] DAMAGECOUNT value on done: 1585.0 +[2023-09-14 14:45:32,951][63767] DAMAGECOUNT value on done: 2902.0 +[2023-09-14 14:45:32,951][63767] Sum rewards: -7.121, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.915', 'AMMO5': '0.005', 'AMMO2': '0.015', 'ARMOR': '0.040', 'AMMO4': '0.075', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'HITCOUNT': '0.140', 'AMMO3': '0.234', 'DAMAGECOUNT': '0.456', 'FRAGCOUNT': '1.000', 'weapon2': '1.076', 'WEAPON3': '1.250', 'weapon3': '2.302'} +[2023-09-14 14:45:32,987][63770] DAMAGECOUNT value on done: 2296.0 +[2023-09-14 14:45:32,987][63770] Sum rewards: -2.554, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.310', 'AMMO2': '0.013', 'AMMO3': '0.062', 'AMMO4': '0.066', 'WEAPON4': '0.100', 'ARMOR': '0.121', 'HITCOUNT': '0.160', 'weapon4': '0.378', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.510', 'weapon3': '0.908', 'FRAGCOUNT': '1.000', 'weapon2': '1.038'} +[2023-09-14 14:45:33,258][63732] Updated weights for policy 0, policy_version 730 (0.0010) +[2023-09-14 14:45:33,338][63767] DAMAGECOUNT value on done: 2772.0 +[2023-09-14 14:45:33,338][63767] Sum rewards: 0.865, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.211', 'AMMO5': '0.008', 'AMMO2': '0.016', 'weapon4': '0.050', 'weapon5': '0.054', 'AMMO3': '0.080', 'AMMO4': '0.081', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'HITCOUNT': '0.310', 'WEAPON3': '0.350', 'weapon3': '1.236', 'DAMAGECOUNT': '1.269', 'weapon2': '1.822', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:45:33,777][63734] DAMAGECOUNT value on done: 1953.0 +[2023-09-14 14:45:33,777][63734] Sum rewards: -8.828, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.156', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.007', 'weapon5': '0.010', 'AMMO2': '0.012', 'WEAPON1': '0.020', 'ARMOR': '0.044', 'AMMO4': '0.059', 'AMMO3': '0.125', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.531', 'WEAPON3': '0.650', 'weapon3': '1.358', 'weapon2': '1.722'} +[2023-09-14 14:45:34,126][63734] DAMAGECOUNT value on done: 2262.0 +[2023-09-14 14:45:34,127][63734] Sum rewards: -2.527, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.016', 'AMMO2': '0.003', 'AMMO4': '0.016', 'WEAPON1': '0.020', 'ARMOR': '0.080', 'HITCOUNT': '0.120', 'AMMO3': '0.129', 'DAMAGECOUNT': '0.513', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.056', 'weapon3': '1.602'} +[2023-09-14 14:45:34,279][63805] DAMAGECOUNT value on done: 1831.0 +[2023-09-14 14:45:34,591][63805] DAMAGECOUNT value on done: 2401.0 +[2023-09-14 14:45:34,772][63805] DAMAGECOUNT value on done: 1865.0 +[2023-09-14 14:45:34,772][63805] Sum rewards: -5.328, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.486', 'AMMO5': '0.015', 'AMMO2': '0.015', 'weapon5': '0.048', 'weapon7': '0.048', 'AMMO4': '0.076', 'HITCOUNT': '0.080', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'AMMO3': '0.197', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon4': '0.204', 'DAMAGECOUNT': '0.600', 'WEAPON3': '1.050', 'weapon2': '1.174', 'weapon3': '1.750', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:45:35,209][63805] DAMAGECOUNT value on done: 2733.0 +[2023-09-14 14:45:35,209][63805] Sum rewards: -1.319, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.343', 'AMMO5': '0.003', 'weapon4': '0.004', 'AMMO2': '0.007', 'AMMO4': '0.035', 'WEAPON5': '0.050', 'weapon7': '0.058', 'ARMOR': '0.084', 'AMMO3': '0.091', 'WEAPON4': '0.100', 'HITCOUNT': '0.150', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.618', 'weapon2': '0.976', 'FRAGCOUNT': '1.000', 'weapon3': '1.498'} +[2023-09-14 14:45:35,486][63733] Updated weights for policy 1, policy_version 740 (0.0011) +[2023-09-14 14:45:37,466][63576] Saving new best policy, reward=-5.125! +[2023-09-14 14:45:37,466][63454] Saving new best policy, reward=-4.362! +[2023-09-14 14:45:38,626][63806] DAMAGECOUNT value on done: 2318.0 +[2023-09-14 14:45:38,626][63806] Sum rewards: -5.556, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.045', 'AMMO2': '0.004', 'weapon5': '0.008', 'AMMO4': '0.019', 'AMMO5': '0.020', 'AMMO3': '0.098', 'WEAPON4': '0.100', 'weapon4': '0.124', 'HITCOUNT': '0.140', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.492', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.314', 'weapon3': '1.320'} +[2023-09-14 14:45:39,019][63806] DAMAGECOUNT value on done: 1668.0 +[2023-09-14 14:45:39,020][63806] Sum rewards: -4.915, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.700', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.007', 'AMMO2': '0.008', 'ARMOR': '0.020', 'weapon5': '0.024', 'AMMO4': '0.039', 'HITCOUNT': '0.080', 'AMMO3': '0.105', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.550', 'weapon3': '0.888', 'weapon2': '1.508'} +[2023-09-14 14:45:39,709][63735] DAMAGECOUNT value on done: 1735.0 +[2023-09-14 14:45:40,032][63735] DAMAGECOUNT value on done: 2062.0 +[2023-09-14 14:45:40,033][63735] Sum rewards: -8.941, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-0.735', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.008', 'AMMO5': '0.010', 'AMMO4': '0.042', 'WEAPON4': '0.050', 'weapon4': '0.050', 'weapon5': '0.054', 'ARMOR': '0.060', 'AMMO3': '0.114', 'HITCOUNT': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.744', 'weapon2': '1.116', 'weapon3': '1.696'} +[2023-09-14 14:45:40,805][63735] Large shaping reward -2.549 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.3, -100.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 14:45:41,101][63732] Updated weights for policy 0, policy_version 740 (0.0011) +[2023-09-14 14:45:41,609][63734] DAMAGECOUNT value on done: 2785.0 +[2023-09-14 14:45:42,095][63734] DAMAGECOUNT value on done: 2191.0 +[2023-09-14 14:45:42,095][63734] Sum rewards: -4.871, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.412', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO4': '0.052', 'ARMOR': '0.056', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'weapon4': '0.114', 'AMMO3': '0.156', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.850', 'weapon2': '1.050', 'weapon3': '1.508', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:45:42,412][63733] Updated weights for policy 1, policy_version 750 (0.0012) +[2023-09-14 14:45:42,461][63576] Saving new best policy, reward=-5.036! +[2023-09-14 14:45:44,755][63735] DAMAGECOUNT value on done: 2847.0 +[2023-09-14 14:45:44,755][63735] Sum rewards: -7.982, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.820', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'weapon5': '0.012', 'ARMOR': '0.033', 'AMMO2': '0.035', 'HITCOUNT': '0.070', 'AMMO3': '0.107', 'WEAPON5': '0.150', 'AMMO4': '0.172', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.240', 'weapon4': '0.384', 'WEAPON3': '0.450', 'weapon3': '0.582', 'weapon2': '1.636'} +[2023-09-14 14:45:45,035][63735] DAMAGECOUNT value on done: 2752.0 +[2023-09-14 14:45:45,036][63735] Sum rewards: -7.168, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-3.005', 'AMMO5': '0.005', 'AMMO2': '0.013', 'WEAPON1': '0.020', 'AMMO4': '0.064', 'HITCOUNT': '0.080', 'WEAPON5': '0.100', 'AMMO3': '0.156', 'weapon4': '0.156', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.411', 'weapon2': '0.822', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon3': '1.610'} +[2023-09-14 14:45:45,586][63769] DAMAGECOUNT value on done: 1931.0 +[2023-09-14 14:45:45,910][63771] DAMAGECOUNT value on done: 1882.0 +[2023-09-14 14:45:45,910][63771] Sum rewards: -6.705, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.632', 'AMMO5': '0.003', 'ARMOR': '0.008', 'AMMO2': '0.012', 'weapon4': '0.012', 'WEAPON5': '0.050', 'AMMO4': '0.058', 'weapon7': '0.070', 'HITCOUNT': '0.080', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.148', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.240', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.424', 'weapon3': '1.682'} +[2023-09-14 14:45:46,029][63769] DAMAGECOUNT value on done: 2240.0 +[2023-09-14 14:45:46,030][63769] Sum rewards: -7.246, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.218', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'ARMOR': '0.016', 'AMMO2': '0.020', 'weapon5': '0.034', 'AMMO4': '0.098', 'weapon4': '0.100', 'AMMO3': '0.146', 'HITCOUNT': '0.180', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.771', 'WEAPON3': '0.850', 'weapon3': '1.356', 'weapon2': '1.626'} +[2023-09-14 14:45:46,204][63806] DAMAGECOUNT value on done: 2752.0 +[2023-09-14 14:45:46,255][63771] DAMAGECOUNT value on done: 2068.0 +[2023-09-14 14:45:46,273][63770] DAMAGECOUNT value on done: 2657.0 +[2023-09-14 14:45:46,273][63770] Sum rewards: 0.938, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.656', 'AMMO2': '0.010', 'AMMO5': '0.012', 'weapon5': '0.032', 'WEAPON4': '0.050', 'AMMO4': '0.051', 'ARMOR': '0.076', 'weapon4': '0.122', 'WEAPON5': '0.150', 'AMMO3': '0.160', 'HITCOUNT': '0.300', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.050', 'weapon2': '1.146', 'weapon3': '1.834', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:45:46,577][63806] DAMAGECOUNT value on done: 2989.0 +[2023-09-14 14:45:46,577][63806] Sum rewards: -4.645, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-3.230', 'AMMO4': '-0.031', 'AMMO2': '-0.006', 'WEAPON1': '0.020', 'weapon5': '0.032', 'AMMO5': '0.033', 'AMMO3': '0.215', 'HITCOUNT': '0.350', 'ARMOR': '0.410', 'WEAPON5': '0.450', 'weapon2': '0.894', 'DAMAGECOUNT': '1.365', 'WEAPON3': '1.400', 'weapon3': '2.454', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:45:46,623][63769] DAMAGECOUNT value on done: 2910.0 +[2023-09-14 14:45:46,623][63769] Sum rewards: 3.735, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.320', 'AMMO5': '0.005', 'AMMO2': '0.005', 'AMMO4': '0.026', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.103', 'weapon7': '0.270', 'HITCOUNT': '0.330', 'ARMOR': '0.448', 'WEAPON3': '0.550', 'weapon2': '1.482', 'weapon3': '1.594', 'DAMAGECOUNT': '1.692', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:45:46,680][63770] DAMAGECOUNT value on done: 1996.0 +[2023-09-14 14:45:46,680][63770] Sum rewards: -3.046, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.760', 'AMMO5': '0.005', 'AMMO2': '0.005', 'weapon5': '0.008', 'weapon7': '0.026', 'AMMO4': '0.027', 'ARMOR': '0.060', 'WEAPON5': '0.100', 'weapon4': '0.104', 'AMMO3': '0.106', 'HITCOUNT': '0.120', 'WEAPON4': '0.150', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'DAMAGECOUNT': '0.285', 'WEAPON3': '0.650', 'weapon3': '0.974', 'FRAGCOUNT': '1.000', 'weapon2': '1.244'} +[2023-09-14 14:45:46,958][63769] DAMAGECOUNT value on done: 1615.0 +[2023-09-14 14:45:46,959][63769] Sum rewards: -7.573, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.460', 'AMMO2': '0.001', 'AMMO5': '0.005', 'AMMO4': '0.006', 'WEAPON1': '0.020', 'weapon5': '0.028', 'WEAPON4': '0.050', 'weapon4': '0.064', 'HITCOUNT': '0.070', 'WEAPON5': '0.100', 'AMMO3': '0.158', 'DAMAGECOUNT': '0.195', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.184', 'weapon2': '1.506'} +[2023-09-14 14:45:47,300][63771] DAMAGECOUNT value on done: 2090.0 +[2023-09-14 14:45:47,301][63771] Sum rewards: -6.474, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.180', 'AMMO5': '0.005', 'AMMO2': '0.014', 'weapon5': '0.018', 'ARMOR': '0.024', 'HITCOUNT': '0.060', 'AMMO4': '0.070', 'WEAPON5': '0.100', 'AMMO3': '0.165', 'DAMAGECOUNT': '0.180', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.264', 'weapon2': '1.506'} +[2023-09-14 14:45:47,467][63454] Saving new best policy, reward=-4.339! +[2023-09-14 14:45:47,623][63771] DAMAGECOUNT value on done: 3088.0 +[2023-09-14 14:45:47,624][63771] Sum rewards: -4.326, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.130', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'weapon5': '0.010', 'AMMO2': '0.019', 'HITCOUNT': '0.020', 'WEAPON5': '0.050', 'ARMOR': '0.072', 'DAMAGECOUNT': '0.075', 'AMMO4': '0.096', 'AMMO3': '0.135', 'WEAPON4': '0.200', 'weapon4': '0.224', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.146', 'weapon3': '1.244'} +[2023-09-14 14:45:48,942][63732] Updated weights for policy 0, policy_version 750 (0.0011) +[2023-09-14 14:45:49,331][63733] Updated weights for policy 1, policy_version 760 (0.0011) +[2023-09-14 14:45:53,751][63767] DAMAGECOUNT value on done: 3098.0 +[2023-09-14 14:45:53,752][63767] Sum rewards: 1.111, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.220', 'weapon4': '0.010', 'AMMO5': '0.017', 'AMMO2': '0.023', 'AMMO3': '0.094', 'WEAPON4': '0.100', 'AMMO4': '0.113', 'weapon5': '0.248', 'HITCOUNT': '0.260', 'WEAPON5': '0.350', 'WEAPON3': '0.500', 'weapon3': '1.264', 'weapon2': '1.672', 'DAMAGECOUNT': '1.680', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:45:54,065][63767] DAMAGECOUNT value on done: 2455.0 +[2023-09-14 14:45:54,065][63767] Sum rewards: -2.734, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.660', 'AMMO4': '-0.018', 'AMMO2': '-0.003', 'AMMO5': '0.010', 'ARMOR': '0.124', 'AMMO3': '0.139', 'WEAPON5': '0.200', 'HITCOUNT': '0.210', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.750', 'weapon2': '1.136', 'weapon3': '1.678', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:45:55,331][63767] DAMAGECOUNT value on done: 3007.0 +[2023-09-14 14:45:55,332][63767] Sum rewards: -6.893, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.386', 'AMMO4': '-0.018', 'AMMO2': '-0.004', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'ARMOR': '0.056', 'HITCOUNT': '0.110', 'weapon5': '0.164', 'AMMO3': '0.200', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.315', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.432', 'weapon2': '1.900'} +[2023-09-14 14:45:55,657][63767] DAMAGECOUNT value on done: 3374.0 +[2023-09-14 14:45:55,658][63767] Sum rewards: 0.375, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.476', 'AMMO4': '-0.038', 'AMMO2': '-0.008', 'ARMOR': '0.020', 'AMMO5': '0.022', 'weapon5': '0.066', 'AMMO3': '0.122', 'WEAPON5': '0.300', 'HITCOUNT': '0.340', 'WEAPON3': '0.700', 'weapon2': '1.418', 'DAMAGECOUNT': '1.806', 'weapon3': '1.852', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:45:56,305][63733] Updated weights for policy 1, policy_version 770 (0.0011) +[2023-09-14 14:45:56,669][63732] Updated weights for policy 0, policy_version 760 (0.0011) +[2023-09-14 14:45:57,033][63805] DAMAGECOUNT value on done: 2035.0 +[2023-09-14 14:45:57,363][63734] DAMAGECOUNT value on done: 1968.0 +[2023-09-14 14:45:57,387][63805] DAMAGECOUNT value on done: 2630.0 +[2023-09-14 14:45:57,388][63805] Sum rewards: -4.904, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.357', 'AMMO2': '0.008', 'AMMO5': '0.013', 'AMMO4': '0.039', 'weapon5': '0.058', 'ARMOR': '0.068', 'AMMO3': '0.140', 'HITCOUNT': '0.170', 'WEAPON5': '0.300', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.687', 'WEAPON3': '0.850', 'weapon2': '1.480', 'weapon3': '1.890'} +[2023-09-14 14:45:57,498][63454] Saving new best policy, reward=-4.306! +[2023-09-14 14:45:57,758][63734] DAMAGECOUNT value on done: 2592.0 +[2023-09-14 14:45:57,759][63734] Sum rewards: -3.949, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.010', 'ARMOR': '0.024', 'weapon5': '0.038', 'WEAPON4': '0.050', 'AMMO4': '0.050', 'AMMO3': '0.074', 'weapon4': '0.098', 'WEAPON5': '0.150', 'HITCOUNT': '0.220', 'HEALTH': '0.330', 'WEAPON3': '0.400', 'weapon3': '0.934', 'DAMAGECOUNT': '0.990', 'weapon2': '1.412'} +[2023-09-14 14:45:58,029][63770] DAMAGECOUNT value on done: 1705.0 +[2023-09-14 14:45:58,030][63770] Sum rewards: 2.377, reward structure: {'DEATHCOUNT': '-1.500', 'HEALTH': '-0.431', 'AMMO4': '-0.034', 'AMMO2': '-0.007', 'HITCOUNT': '0.070', 'AMMO3': '0.076', 'WEAPON3': '0.250', 'DAMAGECOUNT': '0.360', 'ARMOR': '0.477', 'weapon2': '0.574', 'FRAGCOUNT': '1.000', 'weapon3': '1.542'} +[2023-09-14 14:45:58,495][63770] DAMAGECOUNT value on done: 2366.0 +[2023-09-14 14:45:58,495][63770] Sum rewards: -1.133, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.717', 'AMMO2': '0.000', 'AMMO4': '0.001', 'weapon5': '0.008', 'AMMO5': '0.010', 'weapon4': '0.022', 'WEAPON4': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.093', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.210', 'WEAPON3': '0.400', 'ARMOR': '0.484', 'FRAGCOUNT': '1.000', 'weapon2': '1.114', 'weapon3': '1.282'} +[2023-09-14 14:45:59,636][63805] DAMAGECOUNT value on done: 2320.0 +[2023-09-14 14:45:59,636][63805] Sum rewards: -5.170, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.706', 'AMMO4': '-0.020', 'AMMO2': '-0.004', 'AMMO5': '0.008', 'weapon5': '0.028', 'WEAPON1': '0.030', 'WEAPON5': '0.150', 'AMMO3': '0.191', 'HITCOUNT': '0.300', 'ARMOR': '0.472', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.332', 'DAMAGECOUNT': '1.365', 'weapon2': '1.934'} +[2023-09-14 14:46:00,046][63805] DAMAGECOUNT value on done: 3018.0 +[2023-09-14 14:46:00,047][63805] Sum rewards: -1.503, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.368', 'AMMO2': '0.011', 'AMMO4': '0.055', 'AMMO3': '0.107', 'HITCOUNT': '0.260', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.855', 'weapon2': '0.900', 'weapon3': '2.226', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:46:01,727][63806] DAMAGECOUNT value on done: 2646.0 +[2023-09-14 14:46:01,727][63806] Sum rewards: -0.276, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.793', 'AMMO2': '0.009', 'AMMO5': '0.010', 'AMMO4': '0.046', 'weapon7': '0.068', 'AMMO3': '0.092', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.124', 'HITCOUNT': '0.220', 'WEAPON3': '0.450', 'ARMOR': '0.536', 'DAMAGECOUNT': '0.984', 'weapon2': '1.082', 'weapon3': '1.146', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:46:02,008][63805] Large shaping reward 2.632 for [('FRAGCOUNT', 2.0, 2.0), ('HITCOUNT', 0.03, 3.0), ('DAMAGECOUNT', 0.6, 200), ('weapon7', 0.002)] +[2023-09-14 14:46:02,115][63806] DAMAGECOUNT value on done: 1703.0 +[2023-09-14 14:46:02,461][63454] Saving new best policy, reward=-4.244! +[2023-09-14 14:46:02,461][63576] Saving new best policy, reward=-4.868! +[2023-09-14 14:46:03,347][63733] Updated weights for policy 1, policy_version 780 (0.0011) +[2023-09-14 14:46:04,356][63735] DAMAGECOUNT value on done: 1939.0 +[2023-09-14 14:46:04,357][63735] Sum rewards: -3.711, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.897', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'WEAPON1': '0.010', 'AMMO5': '0.025', 'ARMOR': '0.048', 'weapon5': '0.110', 'HITCOUNT': '0.170', 'AMMO3': '0.175', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.612', 'WEAPON3': '0.900', 'weapon2': '1.292', 'weapon3': '1.702', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:46:04,576][63732] Updated weights for policy 0, policy_version 770 (0.0011) +[2023-09-14 14:46:04,780][63735] DAMAGECOUNT value on done: 2110.0 +[2023-09-14 14:46:04,780][63735] Sum rewards: 0.499, reward structure: {'DEATHCOUNT': '-3.750', 'HEALTH': '-0.386', 'AMMO2': '0.017', 'HITCOUNT': '0.040', 'AMMO3': '0.079', 'AMMO4': '0.085', 'ARMOR': '0.112', 'DAMAGECOUNT': '0.144', 'WEAPON4': '0.150', 'WEAPON3': '0.400', 'weapon4': '0.498', 'weapon3': '0.768', 'FRAGCOUNT': '1.000', 'weapon2': '1.342'} +[2023-09-14 14:46:07,113][63734] DAMAGECOUNT value on done: 2955.0 +[2023-09-14 14:46:07,466][63454] Saving new best policy, reward=-4.225! +[2023-09-14 14:46:07,480][63576] Saving new best policy, reward=-4.761! +[2023-09-14 14:46:07,560][63734] DAMAGECOUNT value on done: 2218.0 +[2023-09-14 14:46:07,707][63735] DAMAGECOUNT value on done: 2862.0 +[2023-09-14 14:46:07,708][63735] Sum rewards: -7.377, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-0.150', 'AMMO5': '0.005', 'AMMO2': '0.007', 'HITCOUNT': '0.020', 'weapon4': '0.024', 'AMMO4': '0.033', 'DAMAGECOUNT': '0.045', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'AMMO3': '0.153', 'WEAPON3': '0.700', 'ARMOR': '0.812', 'weapon3': '0.998', 'FRAGCOUNT': '1.000', 'weapon2': '1.576'} +[2023-09-14 14:46:08,044][63735] DAMAGECOUNT value on done: 2772.0 +[2023-09-14 14:46:10,301][63733] Updated weights for policy 1, policy_version 790 (0.0009) +[2023-09-14 14:46:10,720][63806] DAMAGECOUNT value on done: 2764.0 +[2023-09-14 14:46:10,735][63771] DAMAGECOUNT value on done: 2160.0 +[2023-09-14 14:46:10,736][63771] Sum rewards: -4.433, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.126', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'AMMO4': '0.021', 'HITCOUNT': '0.060', 'ARMOR': '0.100', 'AMMO3': '0.143', 'DAMAGECOUNT': '0.210', 'WEAPON3': '0.800', 'weapon2': '0.924', 'weapon3': '1.920', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:46:11,087][63769] DAMAGECOUNT value on done: 2056.0 +[2023-09-14 14:46:11,088][63769] Sum rewards: -6.382, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.936', 'AMMO2': '0.010', 'WEAPON1': '0.010', 'AMMO4': '0.049', 'HITCOUNT': '0.070', 'WEAPON4': '0.100', 'weapon4': '0.148', 'AMMO3': '0.172', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.272', 'weapon3': '1.648'} +[2023-09-14 14:46:11,095][63771] DAMAGECOUNT value on done: 2133.0 +[2023-09-14 14:46:11,096][63771] Sum rewards: -8.785, reward structure: {'DEATHCOUNT': '-12.750', 'FRAGCOUNT': '-2.000', 'HEALTH': '-0.328', 'AMMO2': '0.008', 'AMMO5': '0.017', 'AMMO4': '0.038', 'weapon5': '0.098', 'HITCOUNT': '0.150', 'AMMO3': '0.167', 'WEAPON5': '0.250', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.753', 'ARMOR': '0.800', 'weapon2': '1.670', 'weapon3': '1.692'} +[2023-09-14 14:46:11,169][63771] DAMAGECOUNT value on done: 3303.0 +[2023-09-14 14:46:11,170][63771] Sum rewards: -5.427, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.685', 'AMMO2': '0.002', 'weapon5': '0.002', 'AMMO5': '0.005', 'AMMO4': '0.009', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'weapon4': '0.126', 'AMMO3': '0.161', 'HITCOUNT': '0.190', 'ARMOR': '0.432', 'DAMAGECOUNT': '0.645', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.068', 'weapon3': '1.418'} +[2023-09-14 14:46:11,182][63806] DAMAGECOUNT value on done: 3199.0 +[2023-09-14 14:46:11,182][63806] Sum rewards: -5.983, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.609', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.020', 'AMMO2': '0.029', 'weapon5': '0.040', 'weapon4': '0.042', 'WEAPON4': '0.100', 'AMMO4': '0.144', 'AMMO3': '0.168', 'HITCOUNT': '0.180', 'WEAPON5': '0.250', 'ARMOR': '0.547', 'DAMAGECOUNT': '0.630', 'WEAPON3': '0.900', 'weapon2': '1.460', 'weapon3': '1.866'} +[2023-09-14 14:46:11,454][63769] DAMAGECOUNT value on done: 2410.0 +[2023-09-14 14:46:11,454][63769] Sum rewards: -2.315, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.692', 'AMMO2': '0.012', 'weapon4': '0.018', 'weapon5': '0.034', 'AMMO5': '0.035', 'ARMOR': '0.042', 'AMMO4': '0.059', 'HITCOUNT': '0.150', 'AMMO3': '0.163', 'WEAPON4': '0.200', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.152', 'weapon3': '2.202'} +[2023-09-14 14:46:11,490][63771] DAMAGECOUNT value on done: 2153.0 +[2023-09-14 14:46:11,889][63770] DAMAGECOUNT value on done: 2955.0 +[2023-09-14 14:46:11,890][63770] Sum rewards: -2.897, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.750', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.011', 'WEAPON1': '0.020', 'AMMO5': '0.022', 'ARMOR': '0.035', 'weapon5': '0.038', 'AMMO4': '0.052', 'AMMO3': '0.119', 'HITCOUNT': '0.270', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.894', 'weapon2': '1.194', 'weapon3': '1.998'} +[2023-09-14 14:46:12,105][63769] DAMAGECOUNT value on done: 3040.0 +[2023-09-14 14:46:12,250][63770] DAMAGECOUNT value on done: 2086.0 +[2023-09-14 14:46:12,251][63770] Sum rewards: -0.213, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.124', 'AMMO2': '0.002', 'AMMO5': '0.005', 'AMMO4': '0.011', 'ARMOR': '0.044', 'AMMO3': '0.085', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.270', 'WEAPON3': '0.450', 'weapon2': '1.304', 'weapon3': '1.540', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:46:12,463][63454] Saving new best policy, reward=-4.181! +[2023-09-14 14:46:12,465][63732] Updated weights for policy 0, policy_version 780 (0.0010) +[2023-09-14 14:46:12,541][63769] DAMAGECOUNT value on done: 1781.0 +[2023-09-14 14:46:12,541][63769] Sum rewards: -3.008, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.876', 'AMMO2': '0.019', 'weapon4': '0.020', 'ARMOR': '0.032', 'AMMO4': '0.095', 'WEAPON4': '0.100', 'AMMO3': '0.105', 'HITCOUNT': '0.130', 'DAMAGECOUNT': '0.498', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.014', 'weapon3': '1.704'} +[2023-09-14 14:46:16,269][63767] DAMAGECOUNT value on done: 3350.0 +[2023-09-14 14:46:16,270][63767] Sum rewards: -4.001, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.800', 'weapon5': '0.006', 'AMMO5': '0.007', 'AMMO2': '0.038', 'AMMO3': '0.078', 'WEAPON5': '0.100', 'ARMOR': '0.129', 'HITCOUNT': '0.160', 'weapon4': '0.176', 'AMMO4': '0.188', 'WEAPON3': '0.500', 'WEAPON4': '0.500', 'DAMAGECOUNT': '0.756', 'weapon3': '0.940', 'FRAGCOUNT': '1.000', 'weapon2': '1.470'} +[2023-09-14 14:46:16,621][63767] DAMAGECOUNT value on done: 2881.0 +[2023-09-14 14:46:16,622][63767] Sum rewards: -0.259, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.745', 'AMMO2': '0.018', 'AMMO5': '0.019', 'weapon5': '0.042', 'AMMO4': '0.088', 'weapon4': '0.094', 'AMMO3': '0.154', 'WEAPON4': '0.200', 'HITCOUNT': '0.310', 'WEAPON5': '0.400', 'WEAPON3': '0.850', 'weapon2': '1.100', 'DAMAGECOUNT': '1.278', 'weapon3': '2.182', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:46:17,252][63733] Updated weights for policy 1, policy_version 800 (0.0010) +[2023-09-14 14:46:17,466][63454] Saving new best policy, reward=-4.119! +[2023-09-14 14:46:17,862][63767] DAMAGECOUNT value on done: 3380.0 +[2023-09-14 14:46:17,862][63767] Sum rewards: -1.411, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.610', 'ARMOR': '0.008', 'AMMO2': '0.010', 'AMMO5': '0.010', 'AMMO4': '0.048', 'AMMO3': '0.082', 'weapon5': '0.094', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'HITCOUNT': '0.180', 'weapon4': '0.230', 'WEAPON3': '0.500', 'weapon3': '0.984', 'DAMAGECOUNT': '1.119', 'weapon2': '1.884', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:46:18,218][63767] DAMAGECOUNT value on done: 3504.0 +[2023-09-14 14:46:18,219][63767] Sum rewards: -2.843, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.900', 'AMMO5': '0.012', 'AMMO2': '0.021', 'weapon5': '0.048', 'AMMO3': '0.084', 'HITCOUNT': '0.100', 'AMMO4': '0.103', 'weapon4': '0.104', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.162', 'weapon3': '1.782'} +[2023-09-14 14:46:19,963][63805] DAMAGECOUNT value on done: 2409.0 +[2023-09-14 14:46:19,964][63805] Sum rewards: -5.202, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.000', 'HEALTH': '-0.642', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'AMMO5': '0.013', 'weapon4': '0.042', 'WEAPON4': '0.050', 'AMMO4': '0.053', 'AMMO3': '0.093', 'HITCOUNT': '0.160', 'weapon5': '0.174', 'WEAPON5': '0.200', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.122', 'weapon2': '1.316', 'weapon3': '1.546'} +[2023-09-14 14:46:20,258][63732] Updated weights for policy 0, policy_version 790 (0.0010) +[2023-09-14 14:46:20,356][63805] DAMAGECOUNT value on done: 2950.0 +[2023-09-14 14:46:20,356][63805] Sum rewards: 0.160, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.488', 'AMMO5': '0.005', 'weapon5': '0.016', 'AMMO2': '0.018', 'WEAPON5': '0.050', 'weapon7': '0.060', 'AMMO4': '0.091', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'ARMOR': '0.108', 'HITCOUNT': '0.120', 'AMMO3': '0.126', 'WEAPON4': '0.200', 'weapon4': '0.312', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.945', 'weapon3': '1.100', 'weapon2': '1.296', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:46:20,950][63734] DAMAGECOUNT value on done: 2031.0 +[2023-09-14 14:46:21,294][63734] DAMAGECOUNT value on done: 2601.0 +[2023-09-14 14:46:22,461][63454] Saving new best policy, reward=-3.983! +[2023-09-14 14:46:23,774][63770] DAMAGECOUNT value on done: 1817.0 +[2023-09-14 14:46:23,775][63770] Sum rewards: -2.323, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.696', 'ARMOR': '0.008', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.023', 'HITCOUNT': '0.050', 'weapon5': '0.082', 'AMMO4': '0.115', 'weapon4': '0.126', 'AMMO3': '0.140', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.336', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.320', 'weapon3': '1.602'} +[2023-09-14 14:46:24,124][63770] DAMAGECOUNT value on done: 2441.0 +[2023-09-14 14:46:24,315][63733] Updated weights for policy 1, policy_version 810 (0.0011) +[2023-09-14 14:46:24,482][63806] DAMAGECOUNT value on done: 2721.0 +[2023-09-14 14:46:24,483][63806] Sum rewards: -4.631, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.460', 'AMMO5': '0.005', 'AMMO2': '0.008', 'weapon5': '0.018', 'AMMO4': '0.039', 'ARMOR': '0.044', 'HITCOUNT': '0.060', 'weapon4': '0.068', 'AMMO3': '0.076', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.225', 'WEAPON3': '0.400', 'weapon3': '0.674', 'weapon2': '1.762', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:46:24,676][63805] DAMAGECOUNT value on done: 2535.0 +[2023-09-14 14:46:24,823][63806] DAMAGECOUNT value on done: 1828.0 +[2023-09-14 14:46:25,155][63805] DAMAGECOUNT value on done: 3083.0 +[2023-09-14 14:46:25,155][63805] Sum rewards: -1.366, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.760', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'AMMO5': '0.005', 'WEAPON4': '0.050', 'HITCOUNT': '0.050', 'weapon4': '0.094', 'ARMOR': '0.096', 'WEAPON5': '0.100', 'AMMO3': '0.120', 'DAMAGECOUNT': '0.195', 'WEAPON3': '0.800', 'weapon2': '1.114', 'weapon3': '1.528', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:46:27,468][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000814_3334144.pth... +[2023-09-14 14:46:27,495][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000799_3272704.pth... +[2023-09-14 14:46:27,524][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000505_2068480.pth +[2023-09-14 14:46:27,532][63576] Saving new best policy, reward=-4.695! +[2023-09-14 14:46:27,567][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000447_1830912.pth +[2023-09-14 14:46:27,576][63454] Saving new best policy, reward=-3.942! +[2023-09-14 14:46:28,310][63732] Updated weights for policy 0, policy_version 800 (0.0012) +[2023-09-14 14:46:29,451][63735] DAMAGECOUNT value on done: 2197.0 +[2023-09-14 14:46:29,451][63735] Sum rewards: -2.832, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.468', 'AMMO5': '0.003', 'weapon5': '0.006', 'WEAPON1': '0.010', 'AMMO2': '0.020', 'WEAPON5': '0.050', 'ARMOR': '0.092', 'AMMO4': '0.099', 'AMMO3': '0.131', 'WEAPON4': '0.150', 'HITCOUNT': '0.180', 'weapon4': '0.206', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.774', 'weapon3': '0.996', 'weapon2': '1.320', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:46:29,846][63735] DAMAGECOUNT value on done: 2220.0 +[2023-09-14 14:46:29,847][63735] Sum rewards: -4.449, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.010', 'AMMO5': '0.010', 'weapon5': '0.010', 'AMMO2': '0.011', 'AMMO4': '0.052', 'weapon4': '0.064', 'WEAPON5': '0.100', 'HITCOUNT': '0.100', 'AMMO3': '0.128', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.082', 'weapon2': '1.324'} +[2023-09-14 14:46:30,959][63735] DAMAGECOUNT value on done: 3104.0 +[2023-09-14 14:46:30,960][63735] Sum rewards: -1.408, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.724', 'WEAPON1': '0.010', 'AMMO2': '0.019', 'AMMO4': '0.092', 'AMMO3': '0.121', 'HITCOUNT': '0.210', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.726', 'weapon3': '1.336', 'weapon2': '1.602', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:46:31,186][63733] Updated weights for policy 1, policy_version 820 (0.0012) +[2023-09-14 14:46:31,382][63735] DAMAGECOUNT value on done: 2895.0 +[2023-09-14 14:46:31,382][63735] Sum rewards: -4.250, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.412', 'AMMO4': '-0.010', 'AMMO2': '-0.002', 'AMMO5': '0.003', 'weapon5': '0.012', 'WEAPON5': '0.050', 'HITCOUNT': '0.110', 'ARMOR': '0.112', 'AMMO3': '0.158', 'DAMAGECOUNT': '0.369', 'WEAPON3': '0.900', 'weapon2': '0.996', 'FRAGCOUNT': '1.000', 'weapon3': '1.714'} +[2023-09-14 14:46:32,461][63576] Saving new best policy, reward=-4.588! +[2023-09-14 14:46:32,503][63734] DAMAGECOUNT value on done: 3209.0 +[2023-09-14 14:46:32,503][63734] Sum rewards: -6.547, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.488', 'AMMO5': '0.012', 'AMMO2': '0.020', 'weapon5': '0.080', 'AMMO4': '0.099', 'weapon4': '0.134', 'AMMO3': '0.146', 'WEAPON4': '0.150', 'HITCOUNT': '0.200', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.762', 'WEAPON3': '0.850', 'weapon2': '1.440', 'weapon3': '1.548', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:46:32,930][63734] DAMAGECOUNT value on done: 2218.0 +[2023-09-14 14:46:34,095][63771] DAMAGECOUNT value on done: 2235.0 +[2023-09-14 14:46:34,095][63771] Sum rewards: -5.857, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.647', 'AMMO2': '0.016', 'ARMOR': '0.024', 'HITCOUNT': '0.070', 'weapon4': '0.078', 'AMMO4': '0.082', 'WEAPON4': '0.150', 'AMMO3': '0.153', 'DAMAGECOUNT': '0.225', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.122', 'weapon3': '1.670'} +[2023-09-14 14:46:34,474][63771] DAMAGECOUNT value on done: 3328.0 +[2023-09-14 14:46:35,460][63806] DAMAGECOUNT value on done: 3024.0 +[2023-09-14 14:46:35,460][63806] Sum rewards: -1.744, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.310', 'AMMO2': '0.003', 'AMMO5': '0.010', 'weapon4': '0.014', 'AMMO4': '0.017', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.142', 'HITCOUNT': '0.180', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.780', 'weapon2': '1.268', 'weapon3': '1.502', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:46:35,823][63806] DAMAGECOUNT value on done: 3239.0 +[2023-09-14 14:46:36,000][63732] Updated weights for policy 0, policy_version 810 (0.0011) +[2023-09-14 14:46:36,146][63771] DAMAGECOUNT value on done: 2334.0 +[2023-09-14 14:46:36,146][63771] Sum rewards: -1.687, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO2': '0.007', 'AMMO5': '0.009', 'weapon5': '0.022', 'AMMO4': '0.036', 'ARMOR': '0.048', 'WEAPON4': '0.050', 'AMMO3': '0.117', 'HITCOUNT': '0.140', 'weapon4': '0.170', 'WEAPON5': '0.200', 'HEALTH': '0.280', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.603', 'FRAGCOUNT': '1.000', 'weapon2': '1.218', 'weapon3': '1.362'} +[2023-09-14 14:46:36,447][63771] DAMAGECOUNT value on done: 2218.0 +[2023-09-14 14:46:36,670][63769] DAMAGECOUNT value on done: 2141.0 +[2023-09-14 14:46:36,670][63769] Sum rewards: -7.430, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.629', 'weapon5': '0.002', 'AMMO5': '0.003', 'AMMO2': '0.016', 'weapon4': '0.020', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'HITCOUNT': '0.070', 'AMMO4': '0.080', 'WEAPON4': '0.100', 'AMMO3': '0.179', 'DAMAGECOUNT': '0.255', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.390', 'weapon2': '1.444'} +[2023-09-14 14:46:37,124][63769] DAMAGECOUNT value on done: 2623.0 +[2023-09-14 14:46:37,125][63769] Sum rewards: -4.854, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.068', 'AMMO2': '0.022', 'ARMOR': '0.044', 'AMMO4': '0.108', 'AMMO3': '0.115', 'weapon4': '0.146', 'HITCOUNT': '0.180', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.639', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.130', 'weapon2': '1.830'} +[2023-09-14 14:46:37,468][63454] Saving new best policy, reward=-3.928! +[2023-09-14 14:46:37,718][63770] DAMAGECOUNT value on done: 3035.0 +[2023-09-14 14:46:37,719][63770] Sum rewards: -1.988, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.295', 'AMMO5': '0.007', 'AMMO2': '0.030', 'weapon7': '0.058', 'weapon4': '0.078', 'HITCOUNT': '0.080', 'AMMO3': '0.096', 'WEAPON5': '0.100', 'AMMO4': '0.148', 'DAMAGECOUNT': '0.240', 'WEAPON4': '0.250', 'AMMO6': '0.260', 'AMMO7': '0.260', 'WEAPON7': '0.300', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon2': '1.146', 'weapon3': '2.004'} +[2023-09-14 14:46:37,812][63769] DAMAGECOUNT value on done: 3443.0 +[2023-09-14 14:46:37,813][63769] Sum rewards: 1.461, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.905', 'AMMO5': '0.009', 'ARMOR': '0.016', 'AMMO2': '0.030', 'AMMO3': '0.070', 'weapon5': '0.142', 'AMMO4': '0.147', 'WEAPON4': '0.150', 'weapon4': '0.160', 'WEAPON5': '0.200', 'HITCOUNT': '0.250', 'WEAPON3': '0.400', 'weapon3': '0.890', 'DAMAGECOUNT': '1.209', 'weapon2': '1.692', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:46:38,077][63770] DAMAGECOUNT value on done: 2186.0 +[2023-09-14 14:46:38,077][63770] Sum rewards: -4.205, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.344', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'AMMO5': '0.005', 'ARMOR': '0.028', 'HITCOUNT': '0.070', 'WEAPON5': '0.100', 'AMMO3': '0.135', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.298', 'weapon3': '1.666'} +[2023-09-14 14:46:38,187][63733] Updated weights for policy 1, policy_version 830 (0.0012) +[2023-09-14 14:46:38,220][63769] DAMAGECOUNT value on done: 1811.0 +[2023-09-14 14:46:38,999][63767] DAMAGECOUNT value on done: 3681.0 +[2023-09-14 14:46:39,000][63767] Sum rewards: -6.860, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.216', 'AMMO5': '0.007', 'AMMO2': '0.028', 'weapon5': '0.050', 'ARMOR': '0.064', 'AMMO4': '0.141', 'AMMO3': '0.148', 'WEAPON5': '0.200', 'weapon4': '0.202', 'HITCOUNT': '0.290', 'WEAPON4': '0.400', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.993', 'weapon3': '1.318', 'weapon2': '1.464'} +[2023-09-14 14:46:39,382][63767] DAMAGECOUNT value on done: 3070.0 +[2023-09-14 14:46:39,383][63767] Sum rewards: -1.774, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.578', 'weapon5': '0.006', 'AMMO2': '0.009', 'WEAPON1': '0.010', 'AMMO5': '0.013', 'AMMO4': '0.042', 'weapon4': '0.046', 'WEAPON4': '0.050', 'ARMOR': '0.076', 'AMMO3': '0.109', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.567', 'WEAPON3': '0.750', 'weapon3': '1.416', 'weapon2': '1.600', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:46:40,569][63767] DAMAGECOUNT value on done: 3615.0 +[2023-09-14 14:46:40,569][63767] Sum rewards: 0.275, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.391', 'ARMOR': '0.004', 'AMMO2': '0.022', 'AMMO5': '0.033', 'AMMO3': '0.108', 'AMMO4': '0.110', 'weapon5': '0.152', 'HITCOUNT': '0.160', 'weapon4': '0.166', 'WEAPON4': '0.250', 'WEAPON5': '0.450', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.705', 'weapon2': '0.872', 'weapon3': '1.734', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:46:40,954][63767] DAMAGECOUNT value on done: 3709.0 +[2023-09-14 14:46:40,954][63767] Sum rewards: -2.623, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.751', 'AMMO5': '0.013', 'ARMOR': '0.016', 'weapon5': '0.028', 'AMMO2': '0.029', 'AMMO3': '0.113', 'AMMO4': '0.144', 'weapon4': '0.156', 'HITCOUNT': '0.160', 'WEAPON5': '0.250', 'WEAPON4': '0.350', 'DAMAGECOUNT': '0.615', 'WEAPON3': '0.700', 'weapon3': '1.260', 'weapon2': '1.544', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:46:42,461][63454] Saving new best policy, reward=-3.659! +[2023-09-14 14:46:42,984][63805] DAMAGECOUNT value on done: 2707.0 +[2023-09-14 14:46:42,984][63805] Sum rewards: -6.710, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.734', 'ARMOR': '0.004', 'weapon5': '0.014', 'AMMO5': '0.028', 'AMMO2': '0.030', 'AMMO3': '0.148', 'AMMO4': '0.149', 'weapon4': '0.220', 'HITCOUNT': '0.250', 'WEAPON4': '0.300', 'WEAPON5': '0.450', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.894', 'FRAGCOUNT': '1.000', 'weapon2': '1.210', 'weapon3': '1.478'} +[2023-09-14 14:46:43,352][63805] DAMAGECOUNT value on done: 3187.0 +[2023-09-14 14:46:43,353][63805] Sum rewards: 0.943, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.484', 'AMMO5': '0.005', 'weapon5': '0.022', 'AMMO2': '0.029', 'AMMO3': '0.081', 'WEAPON5': '0.100', 'AMMO4': '0.147', 'weapon4': '0.166', 'HITCOUNT': '0.180', 'WEAPON4': '0.250', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.711', 'weapon2': '1.444', 'weapon3': '1.592', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:46:43,860][63732] Updated weights for policy 0, policy_version 820 (0.0009) +[2023-09-14 14:46:44,823][63734] DAMAGECOUNT value on done: 2090.0 +[2023-09-14 14:46:44,824][63734] Sum rewards: -2.451, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.520', 'AMMO2': '0.013', 'AMMO4': '0.065', 'HITCOUNT': '0.070', 'AMMO3': '0.072', 'WEAPON4': '0.100', 'ARMOR': '0.131', 'DAMAGECOUNT': '0.177', 'weapon4': '0.396', 'WEAPON3': '0.450', 'weapon2': '0.974', 'FRAGCOUNT': '1.000', 'weapon3': '1.370'} +[2023-09-14 14:46:45,184][63733] Updated weights for policy 1, policy_version 840 (0.0010) +[2023-09-14 14:46:45,219][63734] DAMAGECOUNT value on done: 2726.0 +[2023-09-14 14:46:45,220][63734] Sum rewards: -5.562, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.006', 'AMMO5': '0.003', 'weapon5': '0.008', 'AMMO2': '0.014', 'WEAPON5': '0.050', 'AMMO4': '0.069', 'HITCOUNT': '0.080', 'weapon4': '0.094', 'WEAPON4': '0.100', 'AMMO3': '0.104', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.266', 'weapon2': '1.432'} +[2023-09-14 14:46:47,465][63576] Saving new best policy, reward=-4.583! +[2023-09-14 14:46:47,465][63454] Saving new best policy, reward=-3.619! +[2023-09-14 14:46:47,721][63806] DAMAGECOUNT value on done: 2971.0 +[2023-09-14 14:46:47,722][63806] Sum rewards: -6.022, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.188', 'AMMO5': '0.010', 'AMMO2': '0.016', 'ARMOR': '0.044', 'AMMO4': '0.077', 'AMMO3': '0.179', 'weapon4': '0.188', 'HITCOUNT': '0.190', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.750', 'WEAPON3': '0.950', 'weapon2': '1.098', 'weapon3': '1.514', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:46:48,116][63806] DAMAGECOUNT value on done: 1843.0 +[2023-09-14 14:46:48,116][63806] Sum rewards: -10.509, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-2.387', 'AMMO5': '0.005', 'AMMO2': '0.005', 'WEAPON1': '0.010', 'ARMOR': '0.016', 'HITCOUNT': '0.020', 'AMMO4': '0.026', 'weapon4': '0.030', 'DAMAGECOUNT': '0.045', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.162', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.196', 'weapon2': '1.862'} +[2023-09-14 14:46:49,447][63770] DAMAGECOUNT value on done: 1952.0 +[2023-09-14 14:46:49,447][63770] Sum rewards: -6.017, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.992', 'AMMO2': '0.012', 'AMMO5': '0.022', 'weapon5': '0.028', 'AMMO4': '0.061', 'HITCOUNT': '0.110', 'AMMO3': '0.123', 'WEAPON4': '0.200', 'weapon4': '0.266', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.405', 'ARMOR': '0.448', 'WEAPON3': '0.750', 'weapon2': '1.152', 'weapon3': '1.548'} +[2023-09-14 14:46:49,589][63805] DAMAGECOUNT value on done: 2855.0 +[2023-09-14 14:46:49,589][63805] Sum rewards: -1.030, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.204', 'weapon4': '0.002', 'AMMO2': '0.002', 'AMMO4': '0.011', 'AMMO5': '0.017', 'ARMOR': '0.040', 'weapon5': '0.056', 'AMMO3': '0.087', 'WEAPON4': '0.100', 'WEAPON5': '0.250', 'HITCOUNT': '0.250', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.960', 'weapon3': '1.260', 'weapon2': '1.938', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:46:49,790][63770] DAMAGECOUNT value on done: 2511.0 +[2023-09-14 14:46:49,791][63770] Sum rewards: -2.923, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.510', 'AMMO2': '0.006', 'AMMO4': '0.031', 'ARMOR': '0.040', 'HITCOUNT': '0.070', 'weapon4': '0.082', 'WEAPON4': '0.100', 'AMMO3': '0.108', 'DAMAGECOUNT': '0.210', 'WEAPON3': '0.700', 'weapon2': '0.948', 'FRAGCOUNT': '1.000', 'weapon3': '1.792'} +[2023-09-14 14:46:49,954][63805] DAMAGECOUNT value on done: 3098.0 +[2023-09-14 14:46:51,783][63732] Updated weights for policy 0, policy_version 830 (0.0011) +[2023-09-14 14:46:52,143][63733] Updated weights for policy 1, policy_version 850 (0.0011) +[2023-09-14 14:46:53,815][63735] DAMAGECOUNT value on done: 3319.0 +[2023-09-14 14:46:53,816][63735] Sum rewards: -3.131, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.760', 'AMMO2': '0.002', 'AMMO4': '0.007', 'WEAPON4': '0.050', 'ARMOR': '0.088', 'AMMO3': '0.127', 'weapon4': '0.156', 'HITCOUNT': '0.160', 'DAMAGECOUNT': '0.645', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.318', 'weapon3': '1.626'} +[2023-09-14 14:46:54,144][63735] DAMAGECOUNT value on done: 2502.0 +[2023-09-14 14:46:54,145][63735] Sum rewards: -3.014, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.049', 'AMMO2': '0.021', 'AMMO5': '0.037', 'weapon5': '0.058', 'AMMO4': '0.104', 'AMMO3': '0.142', 'WEAPON4': '0.200', 'weapon4': '0.200', 'HITCOUNT': '0.240', 'WEAPON5': '0.550', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.915', 'weapon2': '1.220', 'weapon3': '1.548', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:46:54,198][63735] DAMAGECOUNT value on done: 3137.0 +[2023-09-14 14:46:54,199][63735] Sum rewards: -2.967, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.460', 'AMMO2': '0.011', 'weapon4': '0.022', 'ARMOR': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.057', 'AMMO3': '0.111', 'HITCOUNT': '0.240', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.726', 'FRAGCOUNT': '1.000', 'weapon2': '1.318', 'weapon3': '1.708'} +[2023-09-14 14:46:54,523][63735] DAMAGECOUNT value on done: 2310.0 +[2023-09-14 14:46:54,523][63735] Sum rewards: -4.228, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.400', 'AMMO2': '0.016', 'ARMOR': '0.040', 'HITCOUNT': '0.080', 'AMMO4': '0.081', 'AMMO3': '0.106', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.270', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.144', 'weapon3': '1.634'} +[2023-09-14 14:46:56,858][63771] DAMAGECOUNT value on done: 2264.0 +[2023-09-14 14:46:57,211][63771] DAMAGECOUNT value on done: 3593.0 +[2023-09-14 14:46:57,211][63771] Sum rewards: -7.907, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-3.060', 'AMMO4': '-0.045', 'AMMO2': '-0.009', 'AMMO5': '0.005', 'weapon5': '0.006', 'ARMOR': '0.044', 'WEAPON5': '0.100', 'AMMO3': '0.144', 'HITCOUNT': '0.220', 'DAMAGECOUNT': '0.795', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.306', 'weapon3': '1.886'} +[2023-09-14 14:46:57,466][63576] Saving new best policy, reward=-4.559! +[2023-09-14 14:46:57,953][63734] DAMAGECOUNT value on done: 3411.0 +[2023-09-14 14:46:58,361][63734] DAMAGECOUNT value on done: 2278.0 +[2023-09-14 14:46:58,362][63734] Sum rewards: -4.476, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.180', 'AMMO2': '0.004', 'AMMO4': '0.018', 'ARMOR': '0.048', 'HITCOUNT': '0.060', 'weapon4': '0.060', 'WEAPON4': '0.100', 'AMMO3': '0.168', 'DAMAGECOUNT': '0.180', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.248', 'weapon3': '1.918'} +[2023-09-14 14:46:58,969][63733] Updated weights for policy 1, policy_version 860 (0.0012) +[2023-09-14 14:46:59,426][63732] Updated weights for policy 0, policy_version 840 (0.0010) +[2023-09-14 14:47:00,512][63806] DAMAGECOUNT value on done: 3240.0 +[2023-09-14 14:47:00,512][63806] Sum rewards: -4.430, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.811', 'AMMO2': '0.036', 'ARMOR': '0.052', 'AMMO3': '0.117', 'HITCOUNT': '0.140', 'AMMO4': '0.178', 'weapon4': '0.264', 'WEAPON4': '0.350', 'DAMAGECOUNT': '0.648', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.262', 'weapon3': '1.384'} +[2023-09-14 14:47:00,719][63771] DAMAGECOUNT value on done: 2659.0 +[2023-09-14 14:47:00,719][63771] Sum rewards: -7.757, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-3.112', 'AMMO2': '0.013', 'AMMO5': '0.029', 'ARMOR': '0.040', 'AMMO4': '0.063', 'weapon5': '0.076', 'AMMO3': '0.176', 'WEAPON4': '0.200', 'HITCOUNT': '0.240', 'weapon4': '0.304', 'WEAPON5': '0.500', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.975', 'FRAGCOUNT': '1.000', 'weapon2': '1.412', 'weapon3': '1.428'} +[2023-09-14 14:47:00,885][63806] DAMAGECOUNT value on done: 3319.0 +[2023-09-14 14:47:00,886][63806] Sum rewards: -5.703, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.090', 'ARMOR': '0.004', 'AMMO5': '0.005', 'weapon5': '0.012', 'AMMO2': '0.033', 'WEAPON5': '0.050', 'HITCOUNT': '0.070', 'AMMO3': '0.082', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO4': '0.167', 'DAMAGECOUNT': '0.240', 'weapon4': '0.324', 'WEAPON4': '0.400', 'WEAPON3': '0.400', 'FRAGCOUNT': '1.000', 'weapon3': '1.060', 'weapon2': '1.740'} +[2023-09-14 14:47:01,138][63767] DAMAGECOUNT value on done: 3971.0 +[2023-09-14 14:47:01,138][63767] Sum rewards: -5.526, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.386', 'AMMO2': '0.005', 'AMMO5': '0.015', 'AMMO4': '0.022', 'WEAPON1': '0.040', 'weapon5': '0.054', 'AMMO3': '0.074', 'WEAPON4': '0.150', 'HITCOUNT': '0.220', 'weapon4': '0.224', 'WEAPON5': '0.300', 'WEAPON3': '0.450', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.870', 'weapon3': '1.286', 'weapon2': '1.400'} +[2023-09-14 14:47:01,139][63771] DAMAGECOUNT value on done: 2258.0 +[2023-09-14 14:47:01,481][63767] DAMAGECOUNT value on done: 3320.0 +[2023-09-14 14:47:01,481][63767] Sum rewards: -3.405, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.859', 'AMMO5': '0.010', 'weapon5': '0.012', 'AMMO2': '0.014', 'ARMOR': '0.040', 'AMMO4': '0.069', 'AMMO3': '0.119', 'WEAPON5': '0.200', 'HITCOUNT': '0.200', 'WEAPON4': '0.250', 'weapon4': '0.550', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.750', 'weapon3': '1.224', 'weapon2': '1.316', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:47:02,088][63769] DAMAGECOUNT value on done: 2301.0 +[2023-09-14 14:47:02,088][63769] Sum rewards: -4.897, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.223', 'AMMO5': '0.010', 'weapon5': '0.010', 'AMMO2': '0.012', 'WEAPON1': '0.020', 'weapon4': '0.052', 'AMMO4': '0.058', 'ARMOR': '0.060', 'WEAPON4': '0.100', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'AMMO3': '0.160', 'DAMAGECOUNT': '0.480', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.270', 'weapon2': '1.554'} +[2023-09-14 14:47:02,461][63576] Saving new best policy, reward=-4.557! +[2023-09-14 14:47:02,513][63454] Saving new best policy, reward=-3.610! +[2023-09-14 14:47:02,519][63769] DAMAGECOUNT value on done: 2917.0 +[2023-09-14 14:47:02,519][63769] Sum rewards: -0.137, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.339', 'weapon7': '0.002', 'ARMOR': '0.004', 'AMMO5': '0.005', 'AMMO2': '0.022', 'WEAPON5': '0.050', 'weapon4': '0.096', 'AMMO4': '0.110', 'AMMO3': '0.147', 'WEAPON4': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.240', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.882', 'weapon2': '1.072', 'FRAGCOUNT': '2.000', 'weapon3': '2.272'} +[2023-09-14 14:47:02,633][63767] DAMAGECOUNT value on done: 3784.0 +[2023-09-14 14:47:02,634][63767] Sum rewards: 0.089, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO5': '0.008', 'AMMO2': '0.028', 'weapon5': '0.032', 'AMMO3': '0.067', 'weapon7': '0.080', 'HITCOUNT': '0.090', 'WEAPON5': '0.100', 'AMMO4': '0.141', 'HEALTH': '0.192', 'WEAPON4': '0.200', 'AMMO6': '0.320', 'AMMO7': '0.320', 'weapon4': '0.346', 'WEAPON7': '0.400', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.507', 'FRAGCOUNT': '1.000', 'weapon3': '1.116', 'weapon2': '1.492'} +[2023-09-14 14:47:02,940][63767] DAMAGECOUNT value on done: 3839.0 +[2023-09-14 14:47:02,941][63767] Sum rewards: -0.198, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.550', 'AMMO2': '0.010', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'ARMOR': '0.040', 'weapon5': '0.044', 'AMMO4': '0.052', 'weapon4': '0.058', 'HITCOUNT': '0.080', 'WEAPON4': '0.100', 'AMMO3': '0.119', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.450', 'weapon2': '1.288', 'weapon3': '1.486', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:47:03,121][63769] DAMAGECOUNT value on done: 3458.0 +[2023-09-14 14:47:03,122][63769] Sum rewards: -4.240, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.164', 'AMMO5': '0.007', 'HITCOUNT': '0.010', 'weapon5': '0.016', 'AMMO2': '0.017', 'ARMOR': '0.040', 'DAMAGECOUNT': '0.045', 'WEAPON5': '0.050', 'AMMO4': '0.083', 'AMMO3': '0.121', 'WEAPON4': '0.250', 'weapon4': '0.360', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.112', 'weapon2': '1.362'} +[2023-09-14 14:47:03,266][63770] DAMAGECOUNT value on done: 3261.0 +[2023-09-14 14:47:03,506][63769] DAMAGECOUNT value on done: 1924.0 +[2023-09-14 14:47:03,596][63770] DAMAGECOUNT value on done: 2261.0 +[2023-09-14 14:47:05,762][63805] DAMAGECOUNT value on done: 3037.0 +[2023-09-14 14:47:05,763][63805] Sum rewards: -1.948, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.532', 'AMMO2': '0.002', 'AMMO5': '0.010', 'AMMO4': '0.012', 'ARMOR': '0.020', 'WEAPON4': '0.050', 'weapon4': '0.118', 'AMMO3': '0.188', 'WEAPON5': '0.200', 'HITCOUNT': '0.340', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.990', 'weapon2': '1.138', 'weapon3': '2.216', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:47:05,827][63733] Updated weights for policy 1, policy_version 870 (0.0011) +[2023-09-14 14:47:06,098][63805] DAMAGECOUNT value on done: 3402.0 +[2023-09-14 14:47:06,099][63805] Sum rewards: -3.745, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.059', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.005', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'AMMO4': '0.022', 'weapon4': '0.026', 'weapon7': '0.044', 'ARMOR': '0.068', 'AMMO3': '0.075', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'weapon5': '0.108', 'HITCOUNT': '0.190', 'WEAPON5': '0.250', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.645', 'weapon3': '1.198', 'weapon2': '1.800'} +[2023-09-14 14:47:07,167][63732] Updated weights for policy 0, policy_version 850 (0.0011) +[2023-09-14 14:47:07,465][63454] Saving new best policy, reward=-3.400! +[2023-09-14 14:47:08,038][63734] DAMAGECOUNT value on done: 2319.0 +[2023-09-14 14:47:08,038][63734] Sum rewards: -3.497, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.594', 'weapon5': '0.004', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.032', 'ARMOR': '0.081', 'WEAPON5': '0.100', 'AMMO3': '0.101', 'AMMO4': '0.160', 'HITCOUNT': '0.170', 'WEAPON4': '0.350', 'weapon4': '0.358', 'WEAPON3': '0.500', 'weapon3': '0.574', 'DAMAGECOUNT': '0.687', 'FRAGCOUNT': '1.000', 'weapon2': '1.962'} +[2023-09-14 14:47:08,382][63734] DAMAGECOUNT value on done: 2781.0 +[2023-09-14 14:47:10,569][63806] DAMAGECOUNT value on done: 3076.0 +[2023-09-14 14:47:10,570][63806] Sum rewards: -0.879, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.255', 'AMMO5': '0.003', 'AMMO2': '0.029', 'weapon4': '0.062', 'AMMO3': '0.071', 'HITCOUNT': '0.090', 'AMMO4': '0.144', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.400', 'ARMOR': '0.408', 'weapon3': '0.946', 'FRAGCOUNT': '1.000', 'weapon2': '1.008'} +[2023-09-14 14:47:10,882][63806] DAMAGECOUNT value on done: 2117.0 +[2023-09-14 14:47:10,882][63806] Sum rewards: -3.677, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.302', 'AMMO2': '0.018', 'weapon4': '0.054', 'ARMOR': '0.080', 'AMMO4': '0.087', 'WEAPON4': '0.100', 'AMMO3': '0.166', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.822', 'WEAPON3': '0.900', 'weapon2': '1.436', 'weapon3': '1.502', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:47:12,589][63733] Updated weights for policy 1, policy_version 880 (0.0012) +[2023-09-14 14:47:14,205][63805] DAMAGECOUNT value on done: 3171.0 +[2023-09-14 14:47:14,205][63805] Sum rewards: -1.214, reward structure: {'DEATHCOUNT': '-9.000', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.021', 'weapon5': '0.082', 'AMMO3': '0.085', 'AMMO4': '0.104', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'HITCOUNT': '0.260', 'WEAPON3': '0.450', 'HEALTH': '0.456', 'weapon4': '0.506', 'DAMAGECOUNT': '0.948', 'weapon2': '1.054', 'weapon3': '1.502', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:47:14,640][63805] DAMAGECOUNT value on done: 3117.0 +[2023-09-14 14:47:14,837][63770] DAMAGECOUNT value on done: 2207.0 +[2023-09-14 14:47:14,838][63770] Sum rewards: -7.823, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-2.000', 'HEALTH': '-1.570', 'AMMO5': '0.012', 'AMMO2': '0.015', 'weapon5': '0.050', 'AMMO4': '0.076', 'AMMO3': '0.138', 'weapon4': '0.168', 'HITCOUNT': '0.180', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.765', 'weapon2': '1.042', 'weapon3': '1.850'} +[2023-09-14 14:47:14,844][63732] Updated weights for policy 0, policy_version 860 (0.0010) +[2023-09-14 14:47:15,199][63770] DAMAGECOUNT value on done: 2821.0 +[2023-09-14 14:47:15,200][63770] Sum rewards: -2.958, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.532', 'AMMO5': '0.003', 'weapon5': '0.004', 'AMMO2': '0.012', 'WEAPON5': '0.050', 'AMMO4': '0.062', 'AMMO3': '0.157', 'HITCOUNT': '0.260', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.930', 'weapon2': '1.210', 'weapon3': '1.786', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:47:16,239][63735] DAMAGECOUNT value on done: 3354.0 +[2023-09-14 14:47:16,536][63735] DAMAGECOUNT value on done: 3287.0 +[2023-09-14 14:47:16,537][63735] Sum rewards: -3.313, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.920', 'ARMOR': '0.004', 'AMMO2': '0.021', 'weapon4': '0.032', 'AMMO3': '0.102', 'AMMO4': '0.106', 'HITCOUNT': '0.120', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.216', 'weapon2': '1.256'} +[2023-09-14 14:47:17,468][63576] Saving new best policy, reward=-4.471! +[2023-09-14 14:47:18,233][63735] DAMAGECOUNT value on done: 2566.0 +[2023-09-14 14:47:18,539][63735] DAMAGECOUNT value on done: 2375.0 +[2023-09-14 14:47:19,443][63733] Updated weights for policy 1, policy_version 890 (0.0011) +[2023-09-14 14:47:19,887][63771] DAMAGECOUNT value on done: 2304.0 +[2023-09-14 14:47:20,277][63771] DAMAGECOUNT value on done: 3766.0 +[2023-09-14 14:47:20,277][63771] Sum rewards: -3.882, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.346', 'AMMO5': '0.003', 'AMMO2': '0.004', 'AMMO4': '0.019', 'ARMOR': '0.050', 'WEAPON4': '0.100', 'AMMO3': '0.115', 'HITCOUNT': '0.120', 'weapon4': '0.130', 'DAMAGECOUNT': '0.519', 'WEAPON3': '0.600', 'weapon2': '1.324', 'weapon3': '1.480', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:47:22,462][63576] Saving new best policy, reward=-4.459! +[2023-09-14 14:47:22,512][63732] Updated weights for policy 0, policy_version 870 (0.0011) +[2023-09-14 14:47:22,936][63734] DAMAGECOUNT value on done: 3578.0 +[2023-09-14 14:47:22,936][63734] Sum rewards: 2.006, reward structure: {'DEATHCOUNT': '-5.250', 'AMMO5': '0.005', 'AMMO2': '0.027', 'AMMO3': '0.050', 'ARMOR': '0.064', 'HITCOUNT': '0.070', 'weapon5': '0.082', 'WEAPON5': '0.100', 'AMMO4': '0.132', 'WEAPON4': '0.150', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.501', 'HEALTH': '0.517', 'weapon4': '0.750', 'weapon3': '1.032', 'weapon2': '1.476', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:47:23,123][63767] DAMAGECOUNT value on done: 4134.0 +[2023-09-14 14:47:23,123][63767] Sum rewards: -1.629, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.112', 'ARMOR': '0.008', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'AMMO5': '0.020', 'weapon5': '0.086', 'AMMO4': '0.087', 'HITCOUNT': '0.130', 'AMMO3': '0.142', 'WEAPON4': '0.150', 'weapon4': '0.320', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.489', 'WEAPON3': '0.850', 'weapon2': '1.358', 'weapon3': '1.416', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:47:23,333][63734] DAMAGECOUNT value on done: 2307.0 +[2023-09-14 14:47:23,488][63767] DAMAGECOUNT value on done: 3512.0 +[2023-09-14 14:47:24,682][63767] DAMAGECOUNT value on done: 4146.0 +[2023-09-14 14:47:24,683][63767] Sum rewards: -0.529, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.389', 'AMMO5': '0.020', 'WEAPON1': '0.030', 'AMMO2': '0.040', 'AMMO3': '0.060', 'ARMOR': '0.068', 'weapon5': '0.078', 'AMMO4': '0.202', 'WEAPON5': '0.250', 'WEAPON4': '0.250', 'HITCOUNT': '0.290', 'WEAPON3': '0.350', 'weapon4': '0.404', 'DAMAGECOUNT': '1.086', 'weapon3': '1.206', 'FRAGCOUNT': '1.500', 'weapon2': '1.526'} +[2023-09-14 14:47:24,831][63806] DAMAGECOUNT value on done: 3255.0 +[2023-09-14 14:47:25,058][63767] DAMAGECOUNT value on done: 4244.0 +[2023-09-14 14:47:25,059][63767] Sum rewards: -3.292, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.654', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.018', 'weapon5': '0.030', 'ARMOR': '0.040', 'AMMO4': '0.090', 'WEAPON5': '0.100', 'AMMO3': '0.153', 'WEAPON4': '0.200', 'HITCOUNT': '0.310', 'weapon4': '0.336', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.215', 'weapon2': '1.508', 'weapon3': '1.546', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:47:25,273][63806] DAMAGECOUNT value on done: 3663.0 +[2023-09-14 14:47:25,274][63806] Sum rewards: 0.684, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.118', 'AMMO5': '0.015', 'ARMOR': '0.020', 'AMMO2': '0.021', 'weapon5': '0.096', 'WEAPON4': '0.100', 'AMMO4': '0.104', 'AMMO3': '0.118', 'weapon4': '0.154', 'HITCOUNT': '0.160', 'WEAPON5': '0.300', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.032', 'weapon3': '1.384', 'weapon2': '1.648', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:47:25,544][63771] DAMAGECOUNT value on done: 2824.0 +[2023-09-14 14:47:25,544][63771] Sum rewards: -3.099, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.898', 'AMMO2': '0.008', 'AMMO5': '0.014', 'weapon5': '0.036', 'AMMO4': '0.037', 'WEAPON4': '0.050', 'AMMO3': '0.092', 'ARMOR': '0.108', 'weapon4': '0.114', 'HITCOUNT': '0.170', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.098', 'weapon2': '1.526'} +[2023-09-14 14:47:25,952][63771] DAMAGECOUNT value on done: 2413.0 +[2023-09-14 14:47:25,952][63771] Sum rewards: -3.449, reward structure: {'DEATHCOUNT': '-9.000', 'weapon5': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.010', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'AMMO4': '0.052', 'AMMO3': '0.100', 'WEAPON5': '0.100', 'HEALTH': '0.112', 'HITCOUNT': '0.140', 'weapon4': '0.200', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.102', 'weapon3': '1.562'} +[2023-09-14 14:47:26,365][63733] Updated weights for policy 1, policy_version 900 (0.0011) +[2023-09-14 14:47:27,098][63769] DAMAGECOUNT value on done: 2446.0 +[2023-09-14 14:47:27,098][63769] Sum rewards: -8.579, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-3.030', 'AMMO5': '0.005', 'weapon5': '0.010', 'AMMO2': '0.030', 'weapon4': '0.032', 'ARMOR': '0.064', 'WEAPON5': '0.100', 'HITCOUNT': '0.120', 'AMMO4': '0.150', 'WEAPON4': '0.200', 'AMMO3': '0.214', 'DAMAGECOUNT': '0.435', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.250', 'weapon2': '1.318', 'weapon3': '1.522'} +[2023-09-14 14:47:27,466][63454] Saving new best policy, reward=-3.336! +[2023-09-14 14:47:27,531][63769] DAMAGECOUNT value on done: 3007.0 +[2023-09-14 14:47:27,532][63769] Sum rewards: 1.974, reward structure: {'DEATHCOUNT': '-3.750', 'HEALTH': '-0.230', 'AMMO2': '0.002', 'AMMO5': '0.009', 'AMMO4': '0.011', 'weapon5': '0.042', 'WEAPON4': '0.050', 'AMMO3': '0.083', 'HITCOUNT': '0.090', 'weapon4': '0.094', 'ARMOR': '0.096', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.270', 'WEAPON3': '0.400', 'weapon3': '1.100', 'weapon2': '1.506', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:47:28,207][63769] DAMAGECOUNT value on done: 3598.0 +[2023-09-14 14:47:28,207][63769] Sum rewards: -4.506, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.830', 'ARMOR': '0.008', 'weapon5': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.027', 'WEAPON5': '0.050', 'AMMO4': '0.133', 'HITCOUNT': '0.140', 'AMMO3': '0.154', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.420', 'weapon4': '0.616', 'weapon3': '0.720', 'WEAPON3': '0.750', 'weapon2': '1.788', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:47:28,616][63769] DAMAGECOUNT value on done: 1959.0 +[2023-09-14 14:47:28,620][63805] DAMAGECOUNT value on done: 3276.0 +[2023-09-14 14:47:28,620][63805] Sum rewards: -2.699, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.108', 'AMMO2': '0.007', 'WEAPON1': '0.010', 'ARMOR': '0.012', 'AMMO5': '0.027', 'AMMO4': '0.035', 'weapon5': '0.084', 'AMMO3': '0.160', 'HITCOUNT': '0.170', 'WEAPON4': '0.200', 'weapon4': '0.210', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.717', 'WEAPON3': '0.900', 'weapon2': '1.324', 'FRAGCOUNT': '1.500', 'weapon3': '1.902'} +[2023-09-14 14:47:28,635][63770] DAMAGECOUNT value on done: 3692.0 +[2023-09-14 14:47:28,636][63770] Sum rewards: -1.451, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.379', 'AMMO4': '-0.022', 'AMMO2': '-0.004', 'ARMOR': '0.004', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'weapon5': '0.160', 'AMMO3': '0.195', 'HITCOUNT': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '1.100', 'DAMAGECOUNT': '1.293', 'weapon2': '1.378', 'weapon3': '1.892', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:47:29,018][63805] DAMAGECOUNT value on done: 3702.0 +[2023-09-14 14:47:29,019][63805] Sum rewards: -5.185, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.485', 'AMMO2': '0.006', 'AMMO5': '0.017', 'AMMO4': '0.029', 'ARMOR': '0.036', 'weapon5': '0.038', 'AMMO3': '0.128', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'HITCOUNT': '0.250', 'weapon4': '0.386', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.900', 'weapon2': '1.324', 'weapon3': '1.686'} +[2023-09-14 14:47:29,026][63770] DAMAGECOUNT value on done: 2525.0 +[2023-09-14 14:47:30,420][63732] Updated weights for policy 0, policy_version 880 (0.0011) +[2023-09-14 14:47:31,655][63734] DAMAGECOUNT value on done: 2469.0 +[2023-09-14 14:47:31,655][63734] Sum rewards: -0.479, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.360', 'AMMO2': '0.003', 'AMMO4': '0.014', 'ARMOR': '0.092', 'HITCOUNT': '0.100', 'AMMO3': '0.128', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.750', 'weapon2': '1.238', 'weapon3': '1.606', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:47:32,065][63734] DAMAGECOUNT value on done: 2851.0 +[2023-09-14 14:47:32,066][63734] Sum rewards: -2.741, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.591', 'weapon5': '0.002', 'ARMOR': '0.004', 'AMMO2': '0.009', 'AMMO5': '0.010', 'AMMO4': '0.044', 'HITCOUNT': '0.080', 'AMMO3': '0.163', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.210', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.180', 'weapon2': '1.798'} +[2023-09-14 14:47:32,461][63454] Saving new best policy, reward=-3.276! +[2023-09-14 14:47:32,461][63576] Saving new best policy, reward=-4.414! +[2023-09-14 14:47:33,274][63806] DAMAGECOUNT value on done: 3196.0 +[2023-09-14 14:47:33,388][63733] Updated weights for policy 1, policy_version 910 (0.0012) +[2023-09-14 14:47:33,633][63806] DAMAGECOUNT value on done: 2414.0 +[2023-09-14 14:47:33,633][63806] Sum rewards: -2.333, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.209', 'AMMO2': '0.000', 'AMMO4': '0.002', 'AMMO5': '0.005', 'ARMOR': '0.032', 'weapon5': '0.046', 'AMMO3': '0.090', 'WEAPON5': '0.100', 'HITCOUNT': '0.160', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.891', 'FRAGCOUNT': '1.000', 'weapon2': '1.108', 'weapon3': '1.442'} +[2023-09-14 14:47:37,497][63576] Saving new best policy, reward=-4.370! +[2023-09-14 14:47:38,226][63732] Updated weights for policy 0, policy_version 890 (0.0011) +[2023-09-14 14:47:38,924][63735] DAMAGECOUNT value on done: 3693.0 +[2023-09-14 14:47:38,924][63735] Sum rewards: -3.098, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.034', 'ARMOR': '0.004', 'AMMO5': '0.005', 'weapon5': '0.016', 'AMMO2': '0.017', 'weapon4': '0.052', 'AMMO4': '0.085', 'WEAPON5': '0.100', 'AMMO3': '0.133', 'WEAPON4': '0.150', 'HITCOUNT': '0.280', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.017', 'weapon2': '1.076', 'weapon3': '1.550', 'FRAGCOUNT': '2.500'} +[2023-09-14 14:47:39,172][63805] DAMAGECOUNT value on done: 3942.0 +[2023-09-14 14:47:39,172][63805] Sum rewards: 0.853, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO2': '0.004', 'AMMO5': '0.017', 'AMMO4': '0.022', 'ARMOR': '0.084', 'weapon5': '0.108', 'AMMO3': '0.132', 'HEALTH': '0.236', 'WEAPON5': '0.300', 'HITCOUNT': '0.410', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.750', 'weapon2': '1.264', 'weapon3': '2.212', 'DAMAGECOUNT': '2.313'} +[2023-09-14 14:47:39,255][63735] DAMAGECOUNT value on done: 3372.0 +[2023-09-14 14:47:39,587][63805] DAMAGECOUNT value on done: 3182.0 +[2023-09-14 14:47:39,587][63805] Sum rewards: -4.346, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.672', 'AMMO5': '0.007', 'AMMO2': '0.009', 'ARMOR': '0.020', 'AMMO4': '0.046', 'HITCOUNT': '0.070', 'AMMO3': '0.126', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.195', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.426', 'weapon3': '1.526'} +[2023-09-14 14:47:40,279][63733] Updated weights for policy 1, policy_version 920 (0.0011) +[2023-09-14 14:47:40,294][63770] DAMAGECOUNT value on done: 2502.0 +[2023-09-14 14:47:40,295][63770] Sum rewards: -8.434, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.824', 'FRAGCOUNT': '-1.000', 'AMMO2': '0.012', 'AMMO5': '0.017', 'ARMOR': '0.032', 'AMMO4': '0.062', 'weapon5': '0.074', 'WEAPON4': '0.100', 'AMMO3': '0.188', 'HITCOUNT': '0.190', 'weapon4': '0.274', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.885', 'WEAPON3': '1.100', 'weapon2': '1.456', 'weapon3': '1.700'} +[2023-09-14 14:47:40,670][63770] DAMAGECOUNT value on done: 3130.0 +[2023-09-14 14:47:40,670][63770] Sum rewards: -3.501, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.847', 'AMMO5': '0.010', 'AMMO2': '0.010', 'AMMO4': '0.050', 'WEAPON4': '0.100', 'weapon4': '0.106', 'WEAPON5': '0.150', 'AMMO3': '0.200', 'HITCOUNT': '0.260', 'ARMOR': '0.412', 'weapon2': '0.770', 'DAMAGECOUNT': '0.927', 'WEAPON3': '1.200', 'weapon3': '2.150', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:47:42,461][63454] Saving new best policy, reward=-3.265! +[2023-09-14 14:47:42,584][63735] DAMAGECOUNT value on done: 3146.0 +[2023-09-14 14:47:42,584][63735] Sum rewards: -0.525, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.390', 'AMMO2': '0.015', 'AMMO5': '0.016', 'ARMOR': '0.036', 'AMMO4': '0.072', 'AMMO3': '0.114', 'weapon5': '0.128', 'WEAPON4': '0.150', 'weapon4': '0.204', 'WEAPON5': '0.300', 'HITCOUNT': '0.310', 'WEAPON3': '0.700', 'weapon2': '1.526', 'weapon3': '1.554', 'DAMAGECOUNT': '1.740', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:47:42,911][63735] DAMAGECOUNT value on done: 2395.0 +[2023-09-14 14:47:43,395][63771] DAMAGECOUNT value on done: 2414.0 +[2023-09-14 14:47:43,396][63771] Sum rewards: -5.925, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.388', 'AMMO5': '0.005', 'AMMO2': '0.008', 'WEAPON1': '0.020', 'weapon5': '0.032', 'AMMO4': '0.041', 'ARMOR': '0.056', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.122', 'weapon4': '0.146', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.076', 'weapon2': '1.326'} +[2023-09-14 14:47:43,783][63771] DAMAGECOUNT value on done: 3856.0 +[2023-09-14 14:47:43,784][63771] Sum rewards: -3.385, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.093', 'AMMO5': '0.010', 'AMMO2': '0.016', 'WEAPON1': '0.030', 'HITCOUNT': '0.070', 'AMMO3': '0.075', 'AMMO4': '0.080', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.270', 'WEAPON3': '0.450', 'FRAGCOUNT': '1.000', 'weapon2': '1.354', 'weapon3': '1.452'} +[2023-09-14 14:47:45,752][63767] DAMAGECOUNT value on done: 4250.0 +[2023-09-14 14:47:46,050][63732] Updated weights for policy 0, policy_version 900 (0.0011) +[2023-09-14 14:47:46,165][63767] DAMAGECOUNT value on done: 3919.0 +[2023-09-14 14:47:47,125][63733] Updated weights for policy 1, policy_version 930 (0.0011) +[2023-09-14 14:47:47,435][63767] DAMAGECOUNT value on done: 4515.0 +[2023-09-14 14:47:47,436][63767] Sum rewards: -5.838, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.106', 'AMMO5': '0.011', 'AMMO2': '0.029', 'weapon5': '0.128', 'AMMO4': '0.143', 'WEAPON5': '0.200', 'AMMO3': '0.214', 'HITCOUNT': '0.260', 'weapon4': '0.292', 'WEAPON4': '0.300', 'FRAGCOUNT': '0.500', 'ARMOR': '0.618', 'DAMAGECOUNT': '1.107', 'WEAPON3': '1.200', 'weapon3': '1.586', 'weapon2': '1.680'} +[2023-09-14 14:47:47,466][63454] Saving new best policy, reward=-3.227! +[2023-09-14 14:47:47,819][63767] DAMAGECOUNT value on done: 4448.0 +[2023-09-14 14:47:47,819][63767] Sum rewards: -5.578, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.020', 'FRAGCOUNT': '-0.500', 'ARMOR': '0.012', 'AMMO5': '0.020', 'WEAPON1': '0.020', 'AMMO2': '0.026', 'weapon5': '0.084', 'AMMO3': '0.127', 'AMMO4': '0.131', 'HITCOUNT': '0.180', 'WEAPON4': '0.300', 'WEAPON5': '0.450', 'weapon4': '0.514', 'DAMAGECOUNT': '0.612', 'WEAPON3': '0.750', 'weapon2': '1.226', 'weapon3': '1.490'} +[2023-09-14 14:47:48,353][63734] DAMAGECOUNT value on done: 4013.0 +[2023-09-14 14:47:48,354][63734] Sum rewards: 0.450, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.447', 'AMMO5': '0.014', 'weapon5': '0.020', 'AMMO2': '0.020', 'ARMOR': '0.024', 'AMMO4': '0.100', 'AMMO3': '0.142', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'HITCOUNT': '0.280', 'weapon4': '0.514', 'WEAPON3': '0.750', 'weapon2': '0.890', 'DAMAGECOUNT': '1.305', 'weapon3': '1.888', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:47:48,760][63734] DAMAGECOUNT value on done: 2455.0 +[2023-09-14 14:47:48,761][63734] Sum rewards: -7.424, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.756', 'weapon5': '0.002', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO2': '0.019', 'ARMOR': '0.040', 'AMMO4': '0.093', 'HITCOUNT': '0.130', 'weapon4': '0.130', 'AMMO3': '0.135', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.444', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.004', 'weapon2': '1.512'} +[2023-09-14 14:47:49,051][63806] DAMAGECOUNT value on done: 3385.0 +[2023-09-14 14:47:49,051][63806] Sum rewards: -4.172, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.281', 'AMMO2': '0.006', 'AMMO5': '0.010', 'AMMO4': '0.030', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'ARMOR': '0.105', 'AMMO3': '0.106', 'HITCOUNT': '0.120', 'weapon4': '0.120', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.202', 'weapon2': '1.520'} +[2023-09-14 14:47:49,462][63806] DAMAGECOUNT value on done: 3833.0 +[2023-09-14 14:47:49,462][63806] Sum rewards: 1.252, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.152', 'AMMO5': '0.007', 'AMMO2': '0.023', 'weapon7': '0.056', 'AMMO3': '0.058', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.113', 'weapon5': '0.150', 'HITCOUNT': '0.180', 'weapon4': '0.278', 'AMMO6': '0.300', 'WEAPON7': '0.300', 'AMMO7': '0.300', 'WEAPON3': '0.350', 'DAMAGECOUNT': '0.510', 'FRAGCOUNT': '1.000', 'weapon3': '1.174', 'weapon2': '1.196', 'ARMOR': '1.208'} +[2023-09-14 14:47:50,656][63771] DAMAGECOUNT value on done: 3375.0 +[2023-09-14 14:47:50,657][63771] Sum rewards: -2.204, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.101', 'AMMO4': '-0.002', 'AMMO2': '-0.000', 'AMMO5': '0.010', 'weapon5': '0.072', 'WEAPON4': '0.100', 'AMMO3': '0.152', 'WEAPON5': '0.250', 'HITCOUNT': '0.320', 'weapon4': '0.322', 'ARMOR': '0.567', 'WEAPON3': '0.750', 'weapon3': '1.534', 'DAMAGECOUNT': '1.653', 'weapon2': '1.668', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:47:51,038][63771] DAMAGECOUNT value on done: 2621.0 +[2023-09-14 14:47:51,039][63771] Sum rewards: -6.275, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.493', 'AMMO5': '0.005', 'AMMO2': '0.012', 'ARMOR': '0.048', 'AMMO4': '0.058', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.129', 'HITCOUNT': '0.160', 'weapon4': '0.200', 'DAMAGECOUNT': '0.624', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.262', 'weapon2': '1.270'} +[2023-09-14 14:47:51,686][63805] DAMAGECOUNT value on done: 3692.0 +[2023-09-14 14:47:51,687][63805] Sum rewards: -2.273, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.884', 'AMMO2': '0.019', 'WEAPON1': '0.020', 'ARMOR': '0.025', 'AMMO5': '0.031', 'AMMO4': '0.093', 'AMMO3': '0.118', 'weapon4': '0.224', 'weapon5': '0.238', 'WEAPON4': '0.250', 'HITCOUNT': '0.300', 'WEAPON5': '0.450', 'WEAPON3': '0.750', 'weapon3': '1.240', 'DAMAGECOUNT': '1.248', 'weapon2': '1.356', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:47:52,000][63805] DAMAGECOUNT value on done: 4353.0 +[2023-09-14 14:47:52,001][63805] Sum rewards: 0.132, reward structure: {'DEATHCOUNT': '-9.750', 'AMMO5': '0.016', 'ARMOR': '0.032', 'AMMO2': '0.040', 'HEALTH': '0.048', 'AMMO3': '0.106', 'weapon5': '0.144', 'AMMO4': '0.200', 'WEAPON4': '0.250', 'WEAPON5': '0.300', 'weapon4': '0.340', 'HITCOUNT': '0.390', 'WEAPON3': '0.600', 'weapon2': '1.410', 'weapon3': '1.552', 'DAMAGECOUNT': '1.953', 'FRAGCOUNT': '2.500'} +[2023-09-14 14:47:52,472][63769] DAMAGECOUNT value on done: 2660.0 +[2023-09-14 14:47:52,473][63769] Sum rewards: -4.309, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.000', 'AMMO5': '0.005', 'AMMO2': '0.014', 'weapon5': '0.018', 'ARMOR': '0.044', 'AMMO4': '0.068', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.143', 'weapon4': '0.168', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.642', 'WEAPON3': '0.850', 'weapon2': '1.148', 'weapon3': '1.182', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:47:52,895][63769] DAMAGECOUNT value on done: 3549.0 +[2023-09-14 14:47:52,895][63769] Sum rewards: -0.773, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.735', 'ARMOR': '0.004', 'AMMO5': '0.005', 'AMMO2': '0.017', 'WEAPON5': '0.050', 'weapon5': '0.050', 'weapon7': '0.052', 'AMMO4': '0.084', 'AMMO3': '0.088', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON4': '0.150', 'HITCOUNT': '0.260', 'weapon4': '0.266', 'WEAPON3': '0.600', 'weapon3': '1.304', 'weapon2': '1.606', 'DAMAGECOUNT': '1.626', 'FRAGCOUNT': '2.500'} +[2023-09-14 14:47:53,543][63769] DAMAGECOUNT value on done: 4214.0 +[2023-09-14 14:47:53,544][63769] Sum rewards: 0.875, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.620', 'AMMO2': '0.006', 'AMMO5': '0.022', 'AMMO4': '0.032', 'AMMO3': '0.078', 'WEAPON4': '0.150', 'weapon5': '0.248', 'HITCOUNT': '0.310', 'weapon4': '0.394', 'WEAPON5': '0.400', 'ARMOR': '0.451', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon2': '1.096', 'weapon3': '1.660', 'DAMAGECOUNT': '1.848'} +[2023-09-14 14:47:53,878][63770] DAMAGECOUNT value on done: 3835.0 +[2023-09-14 14:47:53,878][63770] Sum rewards: -5.856, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.541', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.026', 'AMMO2': '0.030', 'WEAPON1': '0.030', 'ARMOR': '0.036', 'AMMO3': '0.105', 'AMMO4': '0.149', 'weapon5': '0.152', 'HITCOUNT': '0.160', 'weapon4': '0.348', 'WEAPON4': '0.350', 'DAMAGECOUNT': '0.429', 'WEAPON5': '0.450', 'WEAPON3': '0.750', 'weapon2': '1.088', 'weapon3': '1.582'} +[2023-09-14 14:47:53,897][63769] DAMAGECOUNT value on done: 2054.0 +[2023-09-14 14:47:53,897][63769] Sum rewards: -3.227, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.046', 'AMMO2': '0.001', 'AMMO4': '0.006', 'ARMOR': '0.028', 'HITCOUNT': '0.090', 'AMMO3': '0.114', 'DAMAGECOUNT': '0.285', 'WEAPON3': '0.700', 'weapon2': '1.186', 'weapon3': '1.658', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:47:53,965][63732] Updated weights for policy 0, policy_version 910 (0.0010) +[2023-09-14 14:47:54,062][63733] Updated weights for policy 1, policy_version 940 (0.0011) +[2023-09-14 14:47:54,322][63770] DAMAGECOUNT value on done: 2719.0 +[2023-09-14 14:47:54,323][63770] Sum rewards: -2.621, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.113', 'AMMO5': '0.005', 'AMMO2': '0.012', 'AMMO4': '0.061', 'AMMO3': '0.071', 'weapon4': '0.074', 'ARMOR': '0.076', 'HITCOUNT': '0.120', 'WEAPON4': '0.150', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.582', 'weapon3': '0.794', 'weapon2': '1.596', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:47:55,123][63734] DAMAGECOUNT value on done: 2569.0 +[2023-09-14 14:47:55,509][63734] DAMAGECOUNT value on done: 2906.0 +[2023-09-14 14:47:55,509][63734] Sum rewards: -7.511, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.760', 'AMMO4': '-0.058', 'AMMO2': '-0.011', 'AMMO5': '0.005', 'weapon7': '0.008', 'ARMOR': '0.040', 'HITCOUNT': '0.060', 'AMMO3': '0.128', 'DAMAGECOUNT': '0.165', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.340', 'weapon2': '1.722'} +[2023-09-14 14:47:55,839][63806] DAMAGECOUNT value on done: 3381.0 +[2023-09-14 14:47:55,839][63806] Sum rewards: -4.740, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.710', 'AMMO2': '0.017', 'WEAPON4': '0.050', 'ARMOR': '0.053', 'AMMO4': '0.082', 'weapon4': '0.120', 'AMMO3': '0.133', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.555', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.336', 'weapon2': '1.554'} +[2023-09-14 14:47:56,215][63806] DAMAGECOUNT value on done: 2554.0 +[2023-09-14 14:48:00,803][63733] Updated weights for policy 1, policy_version 950 (0.0010) +[2023-09-14 14:48:01,680][63732] Updated weights for policy 0, policy_version 920 (0.0011) +[2023-09-14 14:48:01,728][63735] DAMAGECOUNT value on done: 3848.0 +[2023-09-14 14:48:01,728][63735] Sum rewards: -7.437, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.354', 'AMMO5': '0.005', 'AMMO2': '0.015', 'ARMOR': '0.044', 'AMMO4': '0.072', 'weapon4': '0.082', 'WEAPON5': '0.100', 'WEAPON4': '0.150', 'AMMO3': '0.158', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.134', 'weapon3': '1.672'} +[2023-09-14 14:48:02,059][63735] DAMAGECOUNT value on done: 3431.0 +[2023-09-14 14:48:03,972][63805] DAMAGECOUNT value on done: 4167.0 +[2023-09-14 14:48:03,973][63805] Sum rewards: -8.040, reward structure: {'DEATHCOUNT': '-10.500', 'FRAGCOUNT': '-2.000', 'HEALTH': '-1.399', 'AMMO5': '0.011', 'AMMO2': '0.019', 'ARMOR': '0.040', 'AMMO4': '0.093', 'WEAPON4': '0.150', 'HITCOUNT': '0.150', 'weapon4': '0.152', 'AMMO3': '0.155', 'weapon5': '0.216', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.950', 'weapon2': '1.152', 'weapon3': '1.796'} +[2023-09-14 14:48:04,364][63805] DAMAGECOUNT value on done: 3337.0 +[2023-09-14 14:48:04,365][63805] Sum rewards: -3.505, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.438', 'AMMO2': '0.017', 'weapon4': '0.032', 'ARMOR': '0.040', 'AMMO4': '0.084', 'WEAPON4': '0.100', 'AMMO3': '0.107', 'HITCOUNT': '0.120', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.216', 'weapon3': '1.402'} +[2023-09-14 14:48:05,508][63770] DAMAGECOUNT value on done: 2962.0 +[2023-09-14 14:48:05,509][63770] Sum rewards: -2.714, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.803', 'AMMO5': '0.018', 'AMMO2': '0.028', 'ARMOR': '0.064', 'weapon5': '0.072', 'AMMO3': '0.137', 'AMMO4': '0.140', 'WEAPON4': '0.200', 'weapon4': '0.230', 'WEAPON5': '0.300', 'HITCOUNT': '0.390', 'WEAPON3': '0.850', 'weapon2': '1.022', 'DAMAGECOUNT': '1.380', 'FRAGCOUNT': '2.000', 'weapon3': '2.008'} +[2023-09-14 14:48:05,915][63770] DAMAGECOUNT value on done: 3240.0 +[2023-09-14 14:48:06,529][63771] DAMAGECOUNT value on done: 2485.0 +[2023-09-14 14:48:06,894][63771] DAMAGECOUNT value on done: 3935.0 +[2023-09-14 14:48:07,170][63735] DAMAGECOUNT value on done: 3431.0 +[2023-09-14 14:48:07,171][63735] Sum rewards: -6.303, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.476', 'AMMO5': '0.010', 'AMMO2': '0.014', 'ARMOR': '0.040', 'AMMO4': '0.068', 'weapon4': '0.088', 'weapon5': '0.114', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'AMMO3': '0.210', 'HITCOUNT': '0.240', 'DAMAGECOUNT': '0.855', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.200', 'weapon2': '1.200', 'weapon3': '2.084'} +[2023-09-14 14:48:07,603][63735] DAMAGECOUNT value on done: 2528.0 +[2023-09-14 14:48:08,090][63733] Updated weights for policy 1, policy_version 960 (0.0012) +[2023-09-14 14:48:08,346][63767] DAMAGECOUNT value on done: 4479.0 +[2023-09-14 14:48:08,347][63767] Sum rewards: -7.117, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.390', 'AMMO5': '0.007', 'AMMO2': '0.019', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'weapon5': '0.068', 'weapon4': '0.090', 'AMMO4': '0.096', 'AMMO3': '0.131', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'DAMAGECOUNT': '0.687', 'WEAPON3': '0.850', 'weapon2': '1.124', 'weapon3': '1.940'} +[2023-09-14 14:48:08,666][63767] DAMAGECOUNT value on done: 4097.0 +[2023-09-14 14:48:08,666][63767] Sum rewards: -4.000, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.599', 'AMMO5': '0.007', 'AMMO2': '0.016', 'weapon5': '0.026', 'ARMOR': '0.061', 'AMMO4': '0.081', 'AMMO3': '0.089', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'HITCOUNT': '0.200', 'weapon4': '0.326', 'DAMAGECOUNT': '0.534', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.122', 'weapon2': '1.436'} +[2023-09-14 14:48:09,039][63732] Updated weights for policy 0, policy_version 930 (0.0011) +[2023-09-14 14:48:09,846][63767] DAMAGECOUNT value on done: 4755.0 +[2023-09-14 14:48:09,847][63767] Sum rewards: -3.036, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.566', 'AMMO5': '0.007', 'weapon5': '0.018', 'AMMO2': '0.021', 'ARMOR': '0.036', 'weapon4': '0.038', 'AMMO3': '0.082', 'AMMO4': '0.104', 'WEAPON5': '0.150', 'HITCOUNT': '0.250', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.720', 'weapon3': '1.390', 'weapon2': '1.664', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:48:10,189][63767] DAMAGECOUNT value on done: 4895.0 +[2023-09-14 14:48:10,190][63767] Sum rewards: -1.612, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.950', 'AMMO5': '0.012', 'AMMO2': '0.015', 'ARMOR': '0.036', 'weapon4': '0.056', 'weapon5': '0.062', 'AMMO4': '0.072', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'AMMO3': '0.162', 'HITCOUNT': '0.320', 'WEAPON3': '0.950', 'weapon2': '1.282', 'DAMAGECOUNT': '1.341', 'weapon3': '2.030', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:48:12,462][63454] Saving new best policy, reward=-3.221! +[2023-09-14 14:48:13,173][63806] DAMAGECOUNT value on done: 3695.0 +[2023-09-14 14:48:13,173][63806] Sum rewards: -3.769, reward structure: {'DEATHCOUNT': '-9.750', 'AMMO2': '0.004', 'AMMO4': '0.021', 'HEALTH': '0.022', 'ARMOR': '0.028', 'AMMO3': '0.130', 'HITCOUNT': '0.270', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.930', 'FRAGCOUNT': '1.000', 'weapon2': '1.252', 'weapon3': '1.624'} +[2023-09-14 14:48:13,363][63734] DAMAGECOUNT value on done: 4318.0 +[2023-09-14 14:48:13,364][63734] Sum rewards: -4.632, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.915', 'WEAPON1': '0.010', 'AMMO2': '0.013', 'AMMO5': '0.015', 'ARMOR': '0.032', 'weapon4': '0.062', 'AMMO4': '0.065', 'AMMO3': '0.140', 'WEAPON4': '0.150', 'weapon5': '0.168', 'HITCOUNT': '0.250', 'WEAPON5': '0.300', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.915', 'FRAGCOUNT': '1.000', 'weapon3': '1.432', 'weapon2': '1.480'} +[2023-09-14 14:48:13,508][63806] DAMAGECOUNT value on done: 4060.0 +[2023-09-14 14:48:13,509][63806] Sum rewards: -8.030, reward structure: {'DEATHCOUNT': '-11.250', 'FRAGCOUNT': '-2.000', 'HEALTH': '-0.190', 'AMMO5': '0.007', 'ARMOR': '0.024', 'AMMO2': '0.039', 'weapon5': '0.052', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'weapon4': '0.102', 'AMMO3': '0.126', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'AMMO4': '0.192', 'WEAPON4': '0.300', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.681', 'weapon3': '1.246', 'weapon2': '1.520'} +[2023-09-14 14:48:13,735][63734] DAMAGECOUNT value on done: 2663.0 +[2023-09-14 14:48:13,736][63734] Sum rewards: 1.661, reward structure: {'DEATHCOUNT': '-4.500', 'weapon5': '0.002', 'AMMO5': '0.005', 'AMMO2': '0.007', 'AMMO4': '0.036', 'weapon7': '0.042', 'WEAPON5': '0.050', 'AMMO3': '0.080', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'HITCOUNT': '0.120', 'WEAPON3': '0.300', 'ARMOR': '0.500', 'DAMAGECOUNT': '0.624', 'HEALTH': '0.710', 'weapon3': '0.958', 'FRAGCOUNT': '1.000', 'weapon2': '1.426'} +[2023-09-14 14:48:14,301][63805] DAMAGECOUNT value on done: 4019.0 +[2023-09-14 14:48:14,302][63805] Sum rewards: -0.273, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.468', 'AMMO4': '-0.012', 'AMMO2': '-0.002', 'AMMO5': '0.003', 'weapon4': '0.046', 'WEAPON4': '0.050', 'weapon5': '0.050', 'AMMO3': '0.093', 'WEAPON5': '0.100', 'HITCOUNT': '0.200', 'WEAPON3': '0.350', 'FRAGCOUNT': '0.500', 'ARMOR': '0.512', 'DAMAGECOUNT': '0.981', 'weapon2': '1.132', 'weapon3': '1.442'} +[2023-09-14 14:48:14,653][63805] DAMAGECOUNT value on done: 4733.0 +[2023-09-14 14:48:14,654][63805] Sum rewards: -0.854, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.560', 'AMMO2': '0.003', 'AMMO4': '0.013', 'weapon4': '0.032', 'WEAPON4': '0.050', 'weapon7': '0.070', 'AMMO3': '0.116', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON7': '0.200', 'HITCOUNT': '0.230', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.140', 'weapon2': '1.314', 'weapon3': '1.548'} +[2023-09-14 14:48:14,834][63733] Updated weights for policy 1, policy_version 970 (0.0011) +[2023-09-14 14:48:15,834][63771] DAMAGECOUNT value on done: 3952.0 +[2023-09-14 14:48:15,835][63771] Sum rewards: 3.371, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.354', 'AMMO2': '0.003', 'ARMOR': '0.012', 'AMMO4': '0.014', 'AMMO5': '0.016', 'weapon5': '0.094', 'weapon4': '0.100', 'WEAPON4': '0.150', 'AMMO3': '0.196', 'WEAPON5': '0.200', 'HITCOUNT': '0.260', 'WEAPON3': '0.900', 'weapon3': '1.412', 'DAMAGECOUNT': '1.731', 'weapon2': '1.886', 'FRAGCOUNT': '6.000'} +[2023-09-14 14:48:16,231][63771] DAMAGECOUNT value on done: 2792.0 +[2023-09-14 14:48:16,232][63771] Sum rewards: -5.265, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.350', 'AMMO2': '0.002', 'AMMO5': '0.005', 'weapon5': '0.006', 'AMMO4': '0.012', 'WEAPON5': '0.100', 'AMMO3': '0.160', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.513', 'ARMOR': '0.515', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.514', 'weapon2': '1.538'} +[2023-09-14 14:48:17,437][63732] Updated weights for policy 0, policy_version 940 (0.0011) +[2023-09-14 14:48:17,465][63454] Saving new best policy, reward=-3.068! +[2023-09-14 14:48:17,555][63769] DAMAGECOUNT value on done: 2885.0 +[2023-09-14 14:48:17,555][63769] Sum rewards: -5.274, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.390', 'AMMO5': '0.003', 'weapon5': '0.004', 'AMMO2': '0.019', 'WEAPON5': '0.050', 'AMMO4': '0.097', 'WEAPON4': '0.100', 'AMMO3': '0.118', 'HITCOUNT': '0.170', 'weapon4': '0.190', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.675', 'weapon3': '1.242', 'FRAGCOUNT': '1.500', 'weapon2': '1.548'} +[2023-09-14 14:48:17,898][63769] DAMAGECOUNT value on done: 3943.0 +[2023-09-14 14:48:17,899][63769] Sum rewards: 0.716, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.820', 'AMMO5': '0.008', 'AMMO2': '0.024', 'weapon5': '0.078', 'weapon4': '0.094', 'ARMOR': '0.100', 'AMMO3': '0.111', 'AMMO4': '0.121', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'HITCOUNT': '0.210', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.182', 'weapon3': '1.478', 'weapon2': '1.630', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:48:18,196][63806] DAMAGECOUNT value on done: 3461.0 +[2023-09-14 14:48:18,362][63734] DAMAGECOUNT value on done: 2894.0 +[2023-09-14 14:48:18,362][63734] Sum rewards: -5.386, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.300', 'AMMO5': '0.010', 'AMMO2': '0.016', 'weapon5': '0.018', 'WEAPON1': '0.020', 'weapon4': '0.052', 'ARMOR': '0.072', 'AMMO4': '0.082', 'WEAPON4': '0.100', 'AMMO3': '0.133', 'WEAPON5': '0.150', 'HITCOUNT': '0.200', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.975', 'weapon2': '1.346', 'weapon3': '1.440', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:48:18,610][63769] DAMAGECOUNT value on done: 4339.0 +[2023-09-14 14:48:18,610][63769] Sum rewards: -2.514, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-2.177', 'AMMO4': '-0.024', 'AMMO2': '-0.005', 'AMMO5': '0.017', 'ARMOR': '0.080', 'weapon5': '0.096', 'WEAPON4': '0.100', 'AMMO3': '0.112', 'HITCOUNT': '0.150', 'weapon4': '0.248', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.650', 'weapon2': '0.974', 'FRAGCOUNT': '1.000', 'weapon3': '1.590'} +[2023-09-14 14:48:18,654][63806] DAMAGECOUNT value on done: 2850.0 +[2023-09-14 14:48:18,655][63806] Sum rewards: -2.754, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.582', 'AMMO5': '0.005', 'AMMO2': '0.011', 'AMMO4': '0.055', 'AMMO3': '0.095', 'ARMOR': '0.100', 'weapon4': '0.124', 'WEAPON4': '0.150', 'HITCOUNT': '0.180', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.888', 'weapon2': '1.022', 'weapon3': '1.748', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:48:18,757][63734] DAMAGECOUNT value on done: 2996.0 +[2023-09-14 14:48:18,950][63769] DAMAGECOUNT value on done: 2169.0 +[2023-09-14 14:48:18,951][63769] Sum rewards: -2.216, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.654', 'weapon5': '0.002', 'AMMO5': '0.007', 'AMMO2': '0.019', 'WEAPON5': '0.050', 'AMMO3': '0.068', 'ARMOR': '0.084', 'HITCOUNT': '0.090', 'AMMO4': '0.096', 'WEAPON4': '0.200', 'weapon4': '0.258', 'DAMAGECOUNT': '0.345', 'WEAPON3': '0.350', 'weapon3': '0.682', 'FRAGCOUNT': '1.000', 'weapon2': '1.936'} +[2023-09-14 14:48:19,226][63770] DAMAGECOUNT value on done: 4056.0 +[2023-09-14 14:48:19,227][63770] Sum rewards: 1.409, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.170', 'AMMO2': '0.006', 'AMMO5': '0.020', 'AMMO4': '0.027', 'weapon7': '0.086', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.109', 'weapon4': '0.124', 'WEAPON4': '0.150', 'HITCOUNT': '0.180', 'weapon5': '0.302', 'WEAPON5': '0.400', 'ARMOR': '0.471', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.663', 'weapon2': '1.210', 'weapon3': '1.630', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:48:19,621][63770] DAMAGECOUNT value on done: 2844.0 +[2023-09-14 14:48:21,295][63733] Updated weights for policy 1, policy_version 980 (0.0011) +[2023-09-14 14:48:22,461][63454] Saving new best policy, reward=-2.890! +[2023-09-14 14:48:25,430][63732] Updated weights for policy 0, policy_version 950 (0.0012) +[2023-09-14 14:48:26,347][63735] DAMAGECOUNT value on done: 4008.0 +[2023-09-14 14:48:26,732][63735] DAMAGECOUNT value on done: 3848.0 +[2023-09-14 14:48:26,733][63735] Sum rewards: -6.519, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-1.910', 'AMMO5': '0.013', 'AMMO2': '0.019', 'weapon4': '0.030', 'weapon5': '0.050', 'AMMO4': '0.095', 'WEAPON5': '0.150', 'AMMO3': '0.186', 'WEAPON4': '0.200', 'HITCOUNT': '0.330', 'WEAPON3': '1.100', 'weapon2': '1.154', 'DAMAGECOUNT': '1.251', 'weapon3': '2.064', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:48:27,467][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000989_4050944.pth... +[2023-09-14 14:48:27,468][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000952_3899392.pth... +[2023-09-14 14:48:27,526][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000638_2613248.pth +[2023-09-14 14:48:27,527][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000652_2670592.pth +[2023-09-14 14:48:27,533][63454] Saving new best policy, reward=-2.883! +[2023-09-14 14:48:28,146][63733] Updated weights for policy 1, policy_version 990 (0.0011) +[2023-09-14 14:48:28,928][63805] DAMAGECOUNT value on done: 4529.0 +[2023-09-14 14:48:28,929][63805] Sum rewards: 0.758, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.628', 'AMMO5': '0.005', 'ARMOR': '0.020', 'AMMO2': '0.023', 'weapon4': '0.036', 'AMMO4': '0.114', 'AMMO3': '0.120', 'WEAPON4': '0.200', 'HITCOUNT': '0.230', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.086', 'weapon2': '1.412', 'weapon3': '1.740', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:48:29,326][63805] DAMAGECOUNT value on done: 3509.0 +[2023-09-14 14:48:29,327][63805] Sum rewards: -6.323, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.678', 'weapon5': '0.002', 'AMMO5': '0.007', 'ARMOR': '0.012', 'AMMO2': '0.015', 'WEAPON1': '0.030', 'AMMO4': '0.076', 'AMMO3': '0.106', 'HITCOUNT': '0.130', 'WEAPON5': '0.150', 'weapon4': '0.176', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.516', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.204', 'weapon3': '1.780'} +[2023-09-14 14:48:29,628][63771] DAMAGECOUNT value on done: 2575.0 +[2023-09-14 14:48:29,629][63771] Sum rewards: -6.100, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.914', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'AMMO2': '0.006', 'WEAPON1': '0.010', 'ARMOR': '0.012', 'AMMO4': '0.030', 'WEAPON4': '0.050', 'HITCOUNT': '0.070', 'AMMO3': '0.080', 'weapon5': '0.088', 'weapon7': '0.088', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.102', 'DAMAGECOUNT': '0.270', 'WEAPON3': '0.500', 'weapon3': '1.196', 'weapon2': '1.406'} +[2023-09-14 14:48:29,979][63771] DAMAGECOUNT value on done: 4026.0 +[2023-09-14 14:48:29,979][63771] Sum rewards: 0.286, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.564', 'AMMO2': '0.011', 'AMMO4': '0.056', 'AMMO3': '0.081', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'weapon4': '0.184', 'DAMAGECOUNT': '0.273', 'WEAPON3': '0.450', 'ARMOR': '0.508', 'weapon3': '0.826', 'weapon2': '1.520', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:48:30,638][63767] DAMAGECOUNT value on done: 4629.0 +[2023-09-14 14:48:30,639][63767] Sum rewards: -2.764, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.794', 'AMMO2': '0.005', 'AMMO4': '0.025', 'weapon4': '0.082', 'HITCOUNT': '0.100', 'ARMOR': '0.108', 'AMMO3': '0.123', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.750', 'weapon3': '1.554', 'weapon2': '1.682', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:48:30,839][63770] DAMAGECOUNT value on done: 3157.0 +[2023-09-14 14:48:30,840][63770] Sum rewards: -2.833, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.950', 'AMMO5': '0.007', 'AMMO2': '0.047', 'ARMOR': '0.056', 'AMMO3': '0.094', 'WEAPON5': '0.100', 'HITCOUNT': '0.150', 'AMMO4': '0.235', 'weapon4': '0.388', 'WEAPON4': '0.400', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.585', 'FRAGCOUNT': '1.000', 'weapon3': '1.166', 'weapon2': '1.638'} +[2023-09-14 14:48:31,014][63767] DAMAGECOUNT value on done: 4247.0 +[2023-09-14 14:48:31,015][63767] Sum rewards: -3.789, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.446', 'AMMO5': '0.010', 'ARMOR': '0.040', 'AMMO2': '0.042', 'weapon5': '0.100', 'AMMO3': '0.116', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'weapon4': '0.206', 'AMMO4': '0.212', 'WEAPON4': '0.450', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.106', 'weapon3': '1.284'} +[2023-09-14 14:48:31,224][63770] DAMAGECOUNT value on done: 3565.0 +[2023-09-14 14:48:31,225][63770] Sum rewards: -5.436, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.449', 'AMMO4': '-0.041', 'AMMO2': '-0.008', 'AMMO3': '0.193', 'HITCOUNT': '0.210', 'WEAPON3': '0.950', 'DAMAGECOUNT': '0.975', 'weapon3': '1.392', 'weapon2': '1.592', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:48:31,837][63735] DAMAGECOUNT value on done: 3628.0 +[2023-09-14 14:48:31,838][63735] Sum rewards: -5.076, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.840', 'AMMO4': '-0.004', 'AMMO2': '-0.001', 'AMMO5': '0.011', 'weapon4': '0.016', 'ARMOR': '0.059', 'WEAPON4': '0.150', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'weapon5': '0.150', 'AMMO3': '0.155', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.591', 'WEAPON3': '0.750', 'weapon3': '1.212', 'weapon2': '1.874'} +[2023-09-14 14:48:32,176][63735] DAMAGECOUNT value on done: 2578.0 +[2023-09-14 14:48:32,665][63767] DAMAGECOUNT value on done: 4955.0 +[2023-09-14 14:48:32,665][63767] Sum rewards: -1.507, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.065', 'AMMO2': '0.010', 'AMMO4': '0.048', 'WEAPON4': '0.050', 'ARMOR': '0.064', 'AMMO3': '0.136', 'HITCOUNT': '0.140', 'DAMAGECOUNT': '0.600', 'WEAPON3': '0.750', 'weapon2': '1.236', 'weapon3': '1.774', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:48:33,026][63732] Updated weights for policy 0, policy_version 960 (0.0010) +[2023-09-14 14:48:33,060][63767] DAMAGECOUNT value on done: 4905.0 +[2023-09-14 14:48:35,038][63733] Updated weights for policy 1, policy_version 1000 (0.0010) +[2023-09-14 14:48:36,980][63806] DAMAGECOUNT value on done: 3785.0 +[2023-09-14 14:48:36,981][63806] Sum rewards: -8.826, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-3.172', 'AMMO4': '-0.008', 'AMMO2': '-0.002', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'AMMO3': '0.178', 'weapon4': '0.180', 'DAMAGECOUNT': '0.270', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.266', 'weapon2': '1.478'} +[2023-09-14 14:48:37,437][63806] DAMAGECOUNT value on done: 4426.0 +[2023-09-14 14:48:37,437][63806] Sum rewards: -0.857, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.350', 'AMMO2': '0.001', 'AMMO4': '0.004', 'AMMO5': '0.020', 'ARMOR': '0.040', 'AMMO3': '0.100', 'weapon5': '0.114', 'WEAPON4': '0.200', 'HITCOUNT': '0.250', 'WEAPON5': '0.300', 'weapon4': '0.464', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.098', 'weapon2': '1.166', 'weapon3': '1.636', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:48:38,410][63734] DAMAGECOUNT value on done: 4623.0 +[2023-09-14 14:48:38,411][63734] Sum rewards: -2.825, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.725', 'AMMO5': '0.009', 'AMMO2': '0.021', 'ARMOR': '0.068', 'weapon5': '0.082', 'WEAPON4': '0.100', 'AMMO4': '0.107', 'AMMO3': '0.125', 'WEAPON5': '0.250', 'weapon4': '0.254', 'HITCOUNT': '0.290', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.915', 'weapon2': '1.302', 'weapon3': '1.426', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:48:38,855][63734] DAMAGECOUNT value on done: 3031.0 +[2023-09-14 14:48:38,856][63734] Sum rewards: -3.967, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.320', 'AMMO5': '0.003', 'AMMO2': '0.011', 'WEAPON5': '0.050', 'AMMO4': '0.053', 'ARMOR': '0.060', 'weapon5': '0.064', 'WEAPON4': '0.100', 'AMMO3': '0.112', 'HITCOUNT': '0.160', 'weapon4': '0.198', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.650', 'weapon3': '1.000', 'DAMAGECOUNT': '1.104', 'weapon2': '1.538'} +[2023-09-14 14:48:39,082][63805] DAMAGECOUNT value on done: 4129.0 +[2023-09-14 14:48:39,083][63805] Sum rewards: -3.305, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.150', 'AMMO5': '0.007', 'AMMO2': '0.022', 'AMMO3': '0.072', 'HITCOUNT': '0.080', 'AMMO4': '0.108', 'weapon5': '0.112', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.330', 'WEAPON4': '0.350', 'WEAPON3': '0.450', 'weapon4': '0.470', 'weapon3': '0.924', 'FRAGCOUNT': '1.000', 'weapon2': '1.220'} +[2023-09-14 14:48:39,545][63805] DAMAGECOUNT value on done: 4978.0 +[2023-09-14 14:48:39,546][63805] Sum rewards: -6.231, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.452', 'weapon4': '0.012', 'AMMO2': '0.013', 'WEAPON4': '0.050', 'AMMO4': '0.067', 'ARMOR': '0.083', 'HITCOUNT': '0.170', 'AMMO3': '0.179', 'DAMAGECOUNT': '0.735', 'WEAPON3': '0.900', 'weapon3': '1.124', 'weapon2': '1.888', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:48:40,295][63806] DAMAGECOUNT value on done: 3814.0 +[2023-09-14 14:48:40,296][63806] Sum rewards: -1.961, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.470', 'AMMO4': '-0.028', 'AMMO2': '-0.005', 'AMMO5': '0.016', 'weapon7': '0.050', 'weapon5': '0.112', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.131', 'WEAPON7': '0.200', 'HITCOUNT': '0.250', 'WEAPON5': '0.300', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.059', 'weapon2': '1.314', 'weapon3': '1.420', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:48:40,507][63771] DAMAGECOUNT value on done: 4250.0 +[2023-09-14 14:48:40,507][63771] Sum rewards: -6.943, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.242', 'AMMO2': '0.008', 'WEAPON1': '0.010', 'AMMO5': '0.024', 'weapon4': '0.026', 'AMMO4': '0.041', 'WEAPON4': '0.100', 'weapon5': '0.158', 'AMMO3': '0.178', 'HITCOUNT': '0.180', 'WEAPON5': '0.350', 'ARMOR': '0.496', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.810', 'WEAPON3': '0.950', 'weapon2': '1.408', 'weapon3': '1.810'} +[2023-09-14 14:48:40,620][63806] DAMAGECOUNT value on done: 3149.0 +[2023-09-14 14:48:40,621][63806] Sum rewards: 0.231, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.636', 'AMMO2': '0.004', 'AMMO5': '0.007', 'ARMOR': '0.012', 'AMMO4': '0.022', 'weapon5': '0.034', 'weapon7': '0.048', 'WEAPON5': '0.050', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.142', 'WEAPON4': '0.150', 'HITCOUNT': '0.190', 'WEAPON7': '0.200', 'weapon4': '0.208', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.897', 'weapon3': '1.286', 'weapon2': '1.676', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:48:40,935][63771] DAMAGECOUNT value on done: 2930.0 +[2023-09-14 14:48:41,004][63732] Updated weights for policy 0, policy_version 970 (0.0011) +[2023-09-14 14:48:41,775][63734] DAMAGECOUNT value on done: 3254.0 +[2023-09-14 14:48:41,776][63734] Sum rewards: -5.147, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.384', 'AMMO5': '0.003', 'ARMOR': '0.004', 'AMMO2': '0.021', 'WEAPON5': '0.050', 'AMMO3': '0.097', 'AMMO4': '0.106', 'weapon4': '0.136', 'WEAPON4': '0.200', 'HITCOUNT': '0.270', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.080', 'weapon3': '1.218', 'weapon2': '1.702', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:48:42,090][63733] Updated weights for policy 1, policy_version 1010 (0.0010) +[2023-09-14 14:48:42,203][63734] DAMAGECOUNT value on done: 3086.0 +[2023-09-14 14:48:42,673][63769] DAMAGECOUNT value on done: 3140.0 +[2023-09-14 14:48:42,674][63769] Sum rewards: -1.812, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.676', 'AMMO2': '0.008', 'AMMO5': '0.012', 'weapon5': '0.024', 'AMMO4': '0.040', 'WEAPON4': '0.050', 'ARMOR': '0.052', 'AMMO3': '0.064', 'WEAPON5': '0.150', 'HITCOUNT': '0.240', 'weapon4': '0.326', 'WEAPON3': '0.350', 'DAMAGECOUNT': '0.765', 'FRAGCOUNT': '1.000', 'weapon3': '1.202', 'weapon2': '1.330'} +[2023-09-14 14:48:43,066][63769] DAMAGECOUNT value on done: 4512.0 +[2023-09-14 14:48:43,066][63769] Sum rewards: -5.806, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-2.500', 'HEALTH': '-1.646', 'WEAPON1': '0.010', 'AMMO5': '0.018', 'AMMO2': '0.032', 'AMMO3': '0.120', 'AMMO4': '0.159', 'weapon5': '0.176', 'weapon4': '0.280', 'WEAPON4': '0.300', 'HITCOUNT': '0.310', 'WEAPON5': '0.450', 'ARMOR': '0.470', 'WEAPON3': '0.700', 'weapon2': '1.166', 'weapon3': '1.442', 'DAMAGECOUNT': '1.707'} +[2023-09-14 14:48:43,742][63769] DAMAGECOUNT value on done: 4596.0 +[2023-09-14 14:48:43,743][63769] Sum rewards: -1.759, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.200', 'weapon7': '0.002', 'AMMO5': '0.008', 'ARMOR': '0.008', 'AMMO2': '0.032', 'weapon5': '0.062', 'AMMO3': '0.122', 'AMMO4': '0.162', 'WEAPON5': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.200', 'weapon4': '0.230', 'WEAPON4': '0.350', 'DAMAGECOUNT': '0.771', 'WEAPON3': '0.800', 'weapon3': '1.140', 'weapon2': '1.254', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:48:44,146][63769] DAMAGECOUNT value on done: 2279.0 +[2023-09-14 14:48:44,147][63769] Sum rewards: -2.930, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.630', 'AMMO5': '0.005', 'AMMO2': '0.015', 'ARMOR': '0.020', 'WEAPON1': '0.020', 'AMMO4': '0.074', 'WEAPON5': '0.100', 'HITCOUNT': '0.120', 'AMMO3': '0.130', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.330', 'weapon4': '0.436', 'WEAPON3': '0.700', 'weapon2': '1.160', 'weapon3': '1.440', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:48:44,511][63770] DAMAGECOUNT value on done: 4396.0 +[2023-09-14 14:48:44,511][63770] Sum rewards: 0.448, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.498', 'AMMO5': '0.007', 'AMMO2': '0.028', 'ARMOR': '0.040', 'AMMO3': '0.100', 'weapon5': '0.126', 'HITCOUNT': '0.140', 'AMMO4': '0.142', 'WEAPON5': '0.150', 'WEAPON4': '0.250', 'weapon4': '0.286', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.020', 'weapon3': '1.250', 'weapon2': '1.306', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:48:44,912][63770] DAMAGECOUNT value on done: 2874.0 +[2023-09-14 14:48:47,467][63454] Saving new best policy, reward=-2.842! +[2023-09-14 14:48:47,884][63732] Updated weights for policy 0, policy_version 980 (0.0010) +[2023-09-14 14:48:50,406][63733] Updated weights for policy 1, policy_version 1020 (0.0011) +[2023-09-14 14:48:50,895][63735] DAMAGECOUNT value on done: 4358.0 +[2023-09-14 14:48:50,895][63735] Sum rewards: 0.050, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.528', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'ARMOR': '0.060', 'AMMO4': '0.092', 'AMMO3': '0.150', 'WEAPON4': '0.150', 'weapon4': '0.244', 'HITCOUNT': '0.270', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.050', 'weapon2': '1.316', 'weapon3': '1.608', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:48:51,238][63735] DAMAGECOUNT value on done: 4068.0 +[2023-09-14 14:48:51,239][63735] Sum rewards: -3.464, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.483', 'AMMO2': '0.025', 'AMMO3': '0.066', 'AMMO4': '0.122', 'weapon4': '0.144', 'HITCOUNT': '0.180', 'WEAPON4': '0.300', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.660', 'weapon3': '1.014', 'weapon2': '1.858', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:48:51,417][63770] Large shaping reward -2.519 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.27, -90.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 14:48:52,461][63454] Saving new best policy, reward=-2.817! +[2023-09-14 14:48:52,670][63771] DAMAGECOUNT value on done: 2660.0 +[2023-09-14 14:48:52,671][63771] Sum rewards: -4.367, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.428', 'WEAPON1': '0.010', 'AMMO5': '0.013', 'AMMO2': '0.020', 'weapon5': '0.056', 'HITCOUNT': '0.070', 'ARMOR': '0.080', 'AMMO4': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.115', 'weapon4': '0.154', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.255', 'WEAPON3': '0.600', 'weapon3': '0.918', 'FRAGCOUNT': '1.000', 'weapon2': '1.570'} +[2023-09-14 14:48:53,055][63771] DAMAGECOUNT value on done: 4151.0 +[2023-09-14 14:48:53,056][63771] Sum rewards: -5.226, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.367', 'weapon5': '0.008', 'WEAPON1': '0.010', 'AMMO5': '0.010', 'AMMO2': '0.012', 'weapon4': '0.048', 'ARMOR': '0.056', 'AMMO4': '0.057', 'WEAPON5': '0.100', 'AMMO3': '0.125', 'HITCOUNT': '0.130', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.426', 'weapon3': '1.684'} +[2023-09-14 14:48:53,289][63767] DAMAGECOUNT value on done: 5181.0 +[2023-09-14 14:48:53,289][63767] Sum rewards: -0.346, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.994', 'AMMO5': '0.010', 'AMMO2': '0.026', 'weapon4': '0.098', 'AMMO3': '0.109', 'AMMO4': '0.130', 'WEAPON5': '0.150', 'weapon5': '0.224', 'WEAPON4': '0.250', 'HITCOUNT': '0.270', 'WEAPON3': '0.500', 'weapon3': '1.410', 'weapon2': '1.564', 'DAMAGECOUNT': '1.656', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:48:53,619][63767] DAMAGECOUNT value on done: 4465.0 +[2023-09-14 14:48:53,777][63805] DAMAGECOUNT value on done: 5024.0 +[2023-09-14 14:48:53,778][63805] Sum rewards: 0.406, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.483', 'AMMO2': '0.005', 'AMMO5': '0.017', 'ARMOR': '0.024', 'AMMO4': '0.025', 'weapon5': '0.060', 'WEAPON4': '0.150', 'AMMO3': '0.170', 'WEAPON5': '0.300', 'weapon4': '0.362', 'HITCOUNT': '0.390', 'WEAPON3': '0.950', 'weapon2': '1.294', 'DAMAGECOUNT': '1.485', 'weapon3': '1.656', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:48:54,109][63805] DAMAGECOUNT value on done: 3660.0 +[2023-09-14 14:48:54,109][63805] Sum rewards: -2.133, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO2': '0.016', 'ARMOR': '0.040', 'AMMO4': '0.078', 'WEAPON4': '0.100', 'weapon4': '0.144', 'AMMO3': '0.150', 'HITCOUNT': '0.190', 'HEALTH': '0.272', 'DAMAGECOUNT': '0.453', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.362', 'weapon3': '1.612'} +[2023-09-14 14:48:54,408][63732] Updated weights for policy 0, policy_version 990 (0.0011) +[2023-09-14 14:48:55,043][63767] DAMAGECOUNT value on done: 5315.0 +[2023-09-14 14:48:55,044][63767] Sum rewards: 0.569, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.057', 'AMMO5': '0.005', 'weapon5': '0.008', 'AMMO2': '0.018', 'AMMO4': '0.091', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.135', 'HITCOUNT': '0.230', 'weapon4': '0.290', 'ARMOR': '0.504', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.080', 'weapon2': '1.240', 'weapon3': '1.374', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:48:55,399][63767] DAMAGECOUNT value on done: 5102.0 +[2023-09-14 14:48:55,400][63767] Sum rewards: -7.395, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.819', 'AMMO2': '0.004', 'AMMO5': '0.007', 'AMMO4': '0.019', 'WEAPON1': '0.020', 'ARMOR': '0.044', 'weapon4': '0.100', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'HITCOUNT': '0.160', 'AMMO3': '0.201', 'DAMAGECOUNT': '0.591', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050', 'weapon3': '1.572', 'weapon2': '1.606'} +[2023-09-14 14:48:56,109][63770] DAMAGECOUNT value on done: 3706.0 +[2023-09-14 14:48:56,110][63770] Sum rewards: 1.289, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.375', 'AMMO4': '-0.029', 'AMMO2': '-0.006', 'AMMO5': '0.005', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.112', 'AMMO3': '0.179', 'HITCOUNT': '0.450', 'ARMOR': '0.516', 'WEAPON3': '1.150', 'weapon2': '1.512', 'DAMAGECOUNT': '1.647', 'weapon3': '1.928', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:48:56,436][63735] DAMAGECOUNT value on done: 4082.0 +[2023-09-14 14:48:56,436][63735] Sum rewards: -6.966, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-2.250', 'AMMO4': '-0.056', 'AMMO2': '-0.011', 'AMMO5': '0.015', 'weapon5': '0.158', 'AMMO3': '0.192', 'HITCOUNT': '0.280', 'WEAPON5': '0.350', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.362', 'weapon3': '1.720', 'weapon2': '1.774', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:48:56,497][63770] DAMAGECOUNT value on done: 3650.0 +[2023-09-14 14:48:56,497][63770] Sum rewards: -5.989, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-2.000', 'HEALTH': '-1.030', 'AMMO2': '0.006', 'AMMO5': '0.007', 'AMMO4': '0.029', 'weapon5': '0.036', 'ARMOR': '0.040', 'HITCOUNT': '0.080', 'WEAPON5': '0.100', 'AMMO3': '0.115', 'DAMAGECOUNT': '0.255', 'WEAPON3': '0.750', 'weapon2': '1.386', 'weapon3': '1.736'} +[2023-09-14 14:48:56,760][63735] DAMAGECOUNT value on done: 2833.0 +[2023-09-14 14:48:56,760][63735] Sum rewards: -5.781, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.990', 'AMMO5': '0.003', 'weapon5': '0.010', 'AMMO2': '0.030', 'WEAPON5': '0.050', 'ARMOR': '0.080', 'AMMO4': '0.149', 'AMMO3': '0.149', 'HITCOUNT': '0.170', 'weapon4': '0.204', 'WEAPON4': '0.350', 'DAMAGECOUNT': '0.765', 'WEAPON3': '0.850', 'weapon3': '1.096', 'weapon2': '1.554', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:48:58,613][63733] Updated weights for policy 1, policy_version 1030 (0.0010) +[2023-09-14 14:49:00,921][63732] Updated weights for policy 0, policy_version 1000 (0.0010) +[2023-09-14 14:49:01,569][63806] DAMAGECOUNT value on done: 3879.0 +[2023-09-14 14:49:01,570][63806] Sum rewards: -10.279, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-2.245', 'AMMO2': '0.002', 'AMMO5': '0.009', 'AMMO4': '0.011', 'WEAPON1': '0.020', 'HITCOUNT': '0.080', 'AMMO3': '0.143', 'weapon5': '0.146', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.282', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.220', 'weapon2': '1.602'} +[2023-09-14 14:49:01,960][63806] DAMAGECOUNT value on done: 5001.0 +[2023-09-14 14:49:01,960][63806] Sum rewards: -1.918, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.400', 'AMMO5': '0.012', 'AMMO2': '0.033', 'ARMOR': '0.068', 'weapon5': '0.072', 'weapon4': '0.146', 'WEAPON5': '0.150', 'AMMO4': '0.166', 'AMMO3': '0.173', 'WEAPON4': '0.250', 'HITCOUNT': '0.420', 'WEAPON3': '0.700', 'weapon3': '1.448', 'DAMAGECOUNT': '1.725', 'weapon2': '1.868', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:49:03,138][63806] DAMAGECOUNT value on done: 3988.0 +[2023-09-14 14:49:03,138][63806] Sum rewards: -2.667, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.708', 'AMMO2': '0.003', 'AMMO5': '0.007', 'ARMOR': '0.016', 'AMMO4': '0.016', 'WEAPON4': '0.050', 'weapon4': '0.056', 'weapon5': '0.060', 'AMMO3': '0.150', 'HITCOUNT': '0.170', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.522', 'WEAPON3': '0.900', 'weapon3': '1.520', 'weapon2': '1.620', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:49:03,530][63806] DAMAGECOUNT value on done: 3540.0 +[2023-09-14 14:49:03,531][63806] Sum rewards: -9.551, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-3.276', 'AMMO5': '0.014', 'AMMO2': '0.022', 'weapon4': '0.032', 'AMMO4': '0.109', 'weapon5': '0.144', 'WEAPON4': '0.250', 'AMMO3': '0.251', 'HITCOUNT': '0.340', 'WEAPON5': '0.350', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '1.173', 'WEAPON3': '1.300', 'weapon2': '1.492', 'weapon3': '1.998'} +[2023-09-14 14:49:03,553][63734] DAMAGECOUNT value on done: 5161.0 +[2023-09-14 14:49:03,553][63734] Sum rewards: 1.057, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.424', 'AMMO2': '0.011', 'AMMO5': '0.034', 'AMMO4': '0.057', 'weapon4': '0.080', 'AMMO3': '0.136', 'WEAPON4': '0.150', 'weapon5': '0.300', 'HITCOUNT': '0.360', 'WEAPON5': '0.500', 'WEAPON3': '0.900', 'weapon2': '1.238', 'DAMAGECOUNT': '1.614', 'weapon3': '1.850', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:49:03,941][63734] DAMAGECOUNT value on done: 3101.0 +[2023-09-14 14:49:04,063][63805] DAMAGECOUNT value on done: 4789.0 +[2023-09-14 14:49:04,063][63805] Sum rewards: 0.433, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.590', 'AMMO5': '0.007', 'AMMO2': '0.023', 'ARMOR': '0.024', 'weapon5': '0.108', 'AMMO4': '0.114', 'weapon4': '0.188', 'AMMO3': '0.192', 'WEAPON5': '0.250', 'WEAPON4': '0.300', 'HITCOUNT': '0.350', 'weapon2': '0.716', 'WEAPON3': '1.050', 'DAMAGECOUNT': '1.980', 'weapon3': '2.220', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:49:04,533][63805] DAMAGECOUNT value on done: 5018.0 +[2023-09-14 14:49:05,251][63734] DAMAGECOUNT value on done: 3460.0 +[2023-09-14 14:49:05,251][63734] Sum rewards: -10.016, reward structure: {'DEATHCOUNT': '-12.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.250', 'AMMO5': '0.010', 'AMMO2': '0.023', 'ARMOR': '0.044', 'HITCOUNT': '0.080', 'weapon4': '0.098', 'AMMO4': '0.115', 'AMMO3': '0.151', 'weapon5': '0.170', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.618', 'WEAPON3': '0.800', 'weapon3': '1.322', 'weapon2': '1.652'} +[2023-09-14 14:49:05,435][63771] DAMAGECOUNT value on done: 4874.0 +[2023-09-14 14:49:05,435][63771] Sum rewards: 1.355, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.758', 'AMMO2': '0.005', 'AMMO5': '0.015', 'AMMO4': '0.026', 'WEAPON4': '0.050', 'weapon4': '0.104', 'AMMO3': '0.162', 'weapon5': '0.192', 'WEAPON5': '0.200', 'HITCOUNT': '0.300', 'ARMOR': '0.454', 'WEAPON3': '0.850', 'weapon2': '1.596', 'weapon3': '1.786', 'DAMAGECOUNT': '1.872', 'FRAGCOUNT': '3.500'} +[2023-09-14 14:49:05,628][63734] DAMAGECOUNT value on done: 3260.0 +[2023-09-14 14:49:05,628][63734] Sum rewards: -2.303, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.415', 'AMMO2': '0.003', 'AMMO4': '0.016', 'weapon7': '0.078', 'AMMO3': '0.101', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.150', 'HITCOUNT': '0.160', 'weapon4': '0.188', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.522', 'WEAPON3': '0.550', 'weapon3': '0.960', 'FRAGCOUNT': '1.000', 'weapon2': '1.694'} +[2023-09-14 14:49:05,872][63771] DAMAGECOUNT value on done: 3075.0 +[2023-09-14 14:49:05,872][63771] Sum rewards: -2.566, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.676', 'AMMO2': '0.003', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO4': '0.013', 'weapon5': '0.034', 'AMMO3': '0.089', 'HITCOUNT': '0.130', 'WEAPON5': '0.150', 'ARMOR': '0.424', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.600', 'weapon3': '1.294', 'weapon2': '1.420', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:49:07,011][63733] Updated weights for policy 1, policy_version 1040 (0.0012) +[2023-09-14 14:49:07,332][63769] DAMAGECOUNT value on done: 5031.0 +[2023-09-14 14:49:07,333][63769] Sum rewards: -2.924, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.585', 'AMMO2': '0.013', 'AMMO4': '0.064', 'AMMO3': '0.180', 'WEAPON4': '0.200', 'weapon4': '0.266', 'HITCOUNT': '0.290', 'ARMOR': '0.483', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.305', 'weapon2': '1.630', 'weapon3': '1.630', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:49:07,467][63454] Saving new best policy, reward=-2.753! +[2023-09-14 14:49:07,615][63732] Updated weights for policy 0, policy_version 1010 (0.0010) +[2023-09-14 14:49:07,724][63769] DAMAGECOUNT value on done: 2590.0 +[2023-09-14 14:49:07,725][63769] Sum rewards: -0.638, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.955', 'AMMO2': '0.021', 'AMMO3': '0.087', 'AMMO4': '0.106', 'ARMOR': '0.108', 'WEAPON4': '0.200', 'HITCOUNT': '0.260', 'weapon4': '0.316', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.933', 'FRAGCOUNT': '1.000', 'weapon3': '1.270', 'weapon2': '2.216'} +[2023-09-14 14:49:07,983][63769] DAMAGECOUNT value on done: 3389.0 +[2023-09-14 14:49:07,983][63769] Sum rewards: -6.365, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-0.802', 'AMMO2': '0.001', 'AMMO4': '0.005', 'AMMO5': '0.010', 'weapon5': '0.010', 'ARMOR': '0.036', 'WEAPON5': '0.100', 'HITCOUNT': '0.180', 'AMMO3': '0.204', 'DAMAGECOUNT': '0.747', 'WEAPON3': '0.800', 'weapon3': '1.360', 'weapon2': '1.734', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:49:08,388][63769] DAMAGECOUNT value on done: 4774.0 +[2023-09-14 14:49:08,388][63769] Sum rewards: -2.783, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.640', 'AMMO5': '0.007', 'ARMOR': '0.016', 'AMMO2': '0.029', 'weapon5': '0.050', 'AMMO3': '0.081', 'AMMO4': '0.143', 'HITCOUNT': '0.200', 'WEAPON5': '0.200', 'WEAPON4': '0.400', 'weapon4': '0.490', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.786', 'FRAGCOUNT': '1.000', 'weapon2': '1.060', 'weapon3': '1.544'} +[2023-09-14 14:49:09,809][63770] DAMAGECOUNT value on done: 5328.0 +[2023-09-14 14:49:09,809][63770] Sum rewards: 3.174, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.176', 'AMMO5': '0.018', 'AMMO2': '0.028', 'ARMOR': '0.040', 'weapon4': '0.134', 'AMMO4': '0.141', 'AMMO3': '0.167', 'weapon5': '0.236', 'WEAPON4': '0.250', 'HITCOUNT': '0.270', 'WEAPON5': '0.400', 'WEAPON3': '0.900', 'weapon2': '1.584', 'weapon3': '1.636', 'DAMAGECOUNT': '2.796', 'FRAGCOUNT': '5.500'} +[2023-09-14 14:49:10,200][63770] DAMAGECOUNT value on done: 3044.0 +[2023-09-14 14:49:10,201][63770] Sum rewards: -4.628, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.422', 'weapon4': '0.006', 'AMMO2': '0.011', 'WEAPON1': '0.030', 'AMMO4': '0.056', 'ARMOR': '0.092', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.118', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.056', 'weapon2': '2.004'} +[2023-09-14 14:49:12,461][63454] Saving new best policy, reward=-2.670! +[2023-09-14 14:49:14,021][63732] Updated weights for policy 0, policy_version 1020 (0.0011) +[2023-09-14 14:49:15,097][63771] DAMAGECOUNT value on done: 2745.0 +[2023-09-14 14:49:15,097][63771] Sum rewards: -5.797, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.358', 'AMMO4': '-0.012', 'AMMO2': '-0.002', 'AMMO5': '0.005', 'ARMOR': '0.051', 'HITCOUNT': '0.090', 'WEAPON5': '0.100', 'AMMO3': '0.174', 'DAMAGECOUNT': '0.255', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon3': '1.412', 'weapon2': '1.638'} +[2023-09-14 14:49:15,449][63733] Updated weights for policy 1, policy_version 1050 (0.0011) +[2023-09-14 14:49:15,479][63771] DAMAGECOUNT value on done: 4421.0 +[2023-09-14 14:49:15,480][63771] Sum rewards: -2.299, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.760', 'AMMO4': '-0.003', 'AMMO2': '-0.001', 'AMMO5': '0.007', 'weapon5': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'WEAPON5': '0.050', 'weapon4': '0.064', 'AMMO3': '0.139', 'HITCOUNT': '0.200', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.810', 'weapon3': '1.508', 'weapon2': '1.762', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:49:15,603][63735] DAMAGECOUNT value on done: 4623.0 +[2023-09-14 14:49:15,604][63735] Sum rewards: -4.235, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.646', 'AMMO2': '0.002', 'AMMO4': '0.008', 'weapon4': '0.038', 'WEAPON4': '0.050', 'AMMO3': '0.122', 'HITCOUNT': '0.150', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.795', 'FRAGCOUNT': '1.000', 'weapon3': '1.638', 'weapon2': '1.708'} +[2023-09-14 14:49:15,952][63735] DAMAGECOUNT value on done: 4408.0 +[2023-09-14 14:49:15,952][63735] Sum rewards: -1.962, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.489', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO2': '0.027', 'ARMOR': '0.068', 'weapon5': '0.120', 'AMMO4': '0.134', 'AMMO3': '0.148', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'HITCOUNT': '0.280', 'weapon4': '0.322', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.020', 'weapon3': '1.224', 'weapon2': '1.802', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:49:16,199][63767] DAMAGECOUNT value on done: 5741.0 +[2023-09-14 14:49:16,199][63767] Sum rewards: -4.756, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.157', 'AMMO2': '0.009', 'weapon4': '0.012', 'AMMO5': '0.013', 'WEAPON1': '0.030', 'AMMO4': '0.046', 'WEAPON4': '0.050', 'AMMO3': '0.170', 'weapon5': '0.174', 'WEAPON5': '0.350', 'HITCOUNT': '0.470', 'WEAPON3': '0.750', 'weapon3': '1.578', 'DAMAGECOUNT': '1.680', 'weapon2': '1.818', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:49:16,529][63767] DAMAGECOUNT value on done: 5167.0 +[2023-09-14 14:49:16,529][63767] Sum rewards: -0.763, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.336', 'AMMO5': '0.007', 'AMMO2': '0.029', 'weapon5': '0.056', 'ARMOR': '0.064', 'AMMO4': '0.143', 'WEAPON5': '0.150', 'AMMO3': '0.162', 'WEAPON4': '0.200', 'HITCOUNT': '0.440', 'weapon2': '0.534', 'weapon4': '0.566', 'WEAPON3': '1.050', 'DAMAGECOUNT': '2.106', 'weapon3': '2.316', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:49:17,212][63767] DAMAGECOUNT value on done: 5375.0 +[2023-09-14 14:49:17,536][63767] DAMAGECOUNT value on done: 5455.0 +[2023-09-14 14:49:17,537][63767] Sum rewards: -5.246, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.701', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'weapon5': '0.048', 'WEAPON4': '0.050', 'AMMO4': '0.054', 'weapon4': '0.082', 'WEAPON5': '0.100', 'AMMO3': '0.162', 'HITCOUNT': '0.260', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.950', 'weapon2': '1.054', 'DAMAGECOUNT': '1.059', 'weapon3': '1.860'} +[2023-09-14 14:49:18,754][63805] DAMAGECOUNT value on done: 5344.0 +[2023-09-14 14:49:18,754][63805] Sum rewards: 1.434, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.294', 'AMMO2': '0.013', 'AMMO5': '0.021', 'AMMO3': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.064', 'weapon4': '0.078', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'HITCOUNT': '0.150', 'weapon7': '0.194', 'weapon5': '0.228', 'WEAPON3': '0.350', 'WEAPON5': '0.400', 'ARMOR': '0.436', 'weapon3': '0.928', 'DAMAGECOUNT': '0.960', 'weapon2': '1.506', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:49:19,149][63805] DAMAGECOUNT value on done: 3830.0 +[2023-09-14 14:49:19,149][63805] Sum rewards: -6.516, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.320', 'AMMO2': '0.008', 'AMMO5': '0.010', 'ARMOR': '0.040', 'AMMO4': '0.041', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.169', 'WEAPON4': '0.200', 'weapon4': '0.410', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon3': '1.262', 'weapon2': '1.344'} +[2023-09-14 14:49:20,637][63732] Updated weights for policy 0, policy_version 1030 (0.0010) +[2023-09-14 14:49:21,176][63735] DAMAGECOUNT value on done: 4470.0 +[2023-09-14 14:49:21,176][63735] Sum rewards: -5.209, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.752', 'AMMO5': '0.008', 'AMMO2': '0.009', 'AMMO4': '0.046', 'WEAPON4': '0.050', 'weapon4': '0.068', 'weapon5': '0.096', 'WEAPON5': '0.100', 'AMMO3': '0.220', 'HITCOUNT': '0.220', 'WEAPON3': '1.050', 'DAMAGECOUNT': '1.164', 'weapon3': '1.482', 'FRAGCOUNT': '2.000', 'weapon2': '2.030'} +[2023-09-14 14:49:21,385][63770] DAMAGECOUNT value on done: 3846.0 +[2023-09-14 14:49:21,386][63770] Sum rewards: -5.353, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.126', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'weapon4': '0.012', 'AMMO4': '0.017', 'ARMOR': '0.076', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.116', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.184', 'weapon2': '1.974'} +[2023-09-14 14:49:21,570][63735] DAMAGECOUNT value on done: 2963.0 +[2023-09-14 14:49:21,571][63735] Sum rewards: -7.044, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.792', 'AMMO5': '0.005', 'AMMO2': '0.007', 'AMMO4': '0.034', 'HITCOUNT': '0.100', 'AMMO3': '0.158', 'DAMAGECOUNT': '0.390', 'ARMOR': '0.404', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.546', 'weapon3': '1.554'} +[2023-09-14 14:49:21,737][63770] DAMAGECOUNT value on done: 3851.0 +[2023-09-14 14:49:21,737][63770] Sum rewards: 1.401, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.911', 'AMMO2': '0.001', 'AMMO4': '0.004', 'AMMO3': '0.060', 'weapon7': '0.090', 'HITCOUNT': '0.100', 'ARMOR': '0.104', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON7': '0.200', 'WEAPON4': '0.250', 'WEAPON3': '0.500', 'weapon4': '0.550', 'DAMAGECOUNT': '0.603', 'weapon3': '1.298', 'weapon2': '1.562', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:49:22,501][63454] Saving new best policy, reward=-2.607! +[2023-09-14 14:49:23,856][63733] Updated weights for policy 1, policy_version 1060 (0.0010) +[2023-09-14 14:49:26,051][63806] DAMAGECOUNT value on done: 3954.0 +[2023-09-14 14:49:26,051][63806] Sum rewards: -1.770, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.358', 'AMMO2': '0.015', 'ARMOR': '0.064', 'AMMO4': '0.076', 'HITCOUNT': '0.080', 'AMMO3': '0.092', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.225', 'weapon4': '0.328', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.136', 'weapon3': '1.622'} +[2023-09-14 14:49:26,183][63806] DAMAGECOUNT value on done: 4233.0 +[2023-09-14 14:49:26,184][63806] Sum rewards: 0.336, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.542', 'AMMO2': '0.003', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.015', 'weapon7': '0.044', 'WEAPON4': '0.050', 'ARMOR': '0.056', 'weapon5': '0.108', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.140', 'AMMO3': '0.144', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'weapon4': '0.214', 'DAMAGECOUNT': '0.735', 'WEAPON3': '0.800', 'weapon2': '1.522', 'weapon3': '1.634', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:49:26,425][63806] DAMAGECOUNT value on done: 5585.0 +[2023-09-14 14:49:26,425][63806] Sum rewards: 2.030, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.458', 'AMMO2': '0.005', 'AMMO5': '0.016', 'AMMO4': '0.026', 'weapon5': '0.154', 'AMMO3': '0.208', 'WEAPON5': '0.250', 'ARMOR': '0.483', 'HITCOUNT': '0.490', 'WEAPON3': '1.000', 'weapon2': '1.114', 'DAMAGECOUNT': '1.752', 'weapon3': '2.490', 'FRAGCOUNT': '6.000'} +[2023-09-14 14:49:26,559][63806] DAMAGECOUNT value on done: 4115.0 +[2023-09-14 14:49:26,559][63806] Sum rewards: 2.494, reward structure: {'DEATHCOUNT': '-9.000', 'WEAPON1': '0.010', 'AMMO5': '0.019', 'AMMO2': '0.024', 'ARMOR': '0.064', 'AMMO4': '0.118', 'AMMO3': '0.122', 'WEAPON4': '0.150', 'HEALTH': '0.164', 'weapon4': '0.228', 'WEAPON5': '0.250', 'weapon5': '0.252', 'HITCOUNT': '0.320', 'WEAPON3': '0.650', 'weapon2': '1.172', 'DAMAGECOUNT': '1.725', 'weapon3': '1.726', 'FRAGCOUNT': '4.500'} +[2023-09-14 14:49:27,082][63732] Updated weights for policy 0, policy_version 1040 (0.0011) +[2023-09-14 14:49:27,465][63454] Saving new best policy, reward=-2.497! +[2023-09-14 14:49:28,528][63734] DAMAGECOUNT value on done: 5251.0 +[2023-09-14 14:49:28,821][63734] DAMAGECOUNT value on done: 3973.0 +[2023-09-14 14:49:28,821][63734] Sum rewards: -2.103, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.706', 'AMMO2': '0.003', 'AMMO5': '0.011', 'AMMO4': '0.017', 'weapon5': '0.098', 'WEAPON4': '0.100', 'AMMO3': '0.175', 'WEAPON5': '0.250', 'weapon4': '0.254', 'HITCOUNT': '0.390', 'WEAPON3': '0.850', 'ARMOR': '0.915', 'weapon2': '1.470', 'FRAGCOUNT': '1.500', 'DAMAGECOUNT': '1.539', 'weapon3': '1.780'} +[2023-09-14 14:49:28,923][63734] DAMAGECOUNT value on done: 3294.0 +[2023-09-14 14:49:28,924][63734] Sum rewards: -4.464, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.608', 'AMMO5': '0.005', 'AMMO2': '0.012', 'AMMO4': '0.059', 'weapon4': '0.062', 'WEAPON4': '0.100', 'AMMO3': '0.127', 'HITCOUNT': '0.240', 'ARMOR': '0.428', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.579', 'weapon3': '1.448', 'FRAGCOUNT': '2.000', 'weapon2': '2.084'} +[2023-09-14 14:49:29,000][63805] DAMAGECOUNT value on done: 4976.0 +[2023-09-14 14:49:29,000][63805] Sum rewards: -7.480, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-0.869', 'AMMO5': '0.005', 'AMMO2': '0.028', 'ARMOR': '0.056', 'WEAPON5': '0.100', 'AMMO4': '0.141', 'HITCOUNT': '0.160', 'AMMO3': '0.194', 'WEAPON4': '0.200', 'weapon4': '0.260', 'DAMAGECOUNT': '0.561', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon3': '1.512', 'weapon2': '1.722'} +[2023-09-14 14:49:29,226][63734] DAMAGECOUNT value on done: 3370.0 +[2023-09-14 14:49:29,226][63734] Sum rewards: 0.695, reward structure: {'DEATHCOUNT': '-5.250', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'ARMOR': '0.064', 'weapon4': '0.072', 'AMMO4': '0.082', 'AMMO3': '0.084', 'WEAPON4': '0.100', 'weapon5': '0.110', 'HITCOUNT': '0.120', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.330', 'HEALTH': '0.358', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.442', 'weapon2': '1.448'} +[2023-09-14 14:49:29,411][63805] DAMAGECOUNT value on done: 5208.0 +[2023-09-14 14:49:29,411][63805] Sum rewards: -2.148, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.940', 'AMMO2': '0.001', 'AMMO4': '0.004', 'AMMO5': '0.005', 'weapon5': '0.022', 'ARMOR': '0.032', 'AMMO3': '0.098', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.570', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.466', 'weapon2': '1.544'} +[2023-09-14 14:49:30,299][63771] DAMAGECOUNT value on done: 4988.0 +[2023-09-14 14:49:30,299][63771] Sum rewards: -1.669, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.184', 'AMMO2': '0.014', 'AMMO5': '0.015', 'ARMOR': '0.048', 'AMMO4': '0.068', 'AMMO3': '0.088', 'weapon5': '0.092', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.130', 'weapon7': '0.154', 'WEAPON7': '0.200', 'WEAPON4': '0.250', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.342', 'WEAPON3': '0.500', 'weapon4': '0.508', 'FRAGCOUNT': '1.000', 'weapon3': '1.002', 'weapon2': '1.314'} +[2023-09-14 14:49:30,734][63771] DAMAGECOUNT value on done: 3262.0 +[2023-09-14 14:49:30,735][63771] Sum rewards: -7.991, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.028', 'AMMO2': '0.011', 'AMMO5': '0.011', 'ARMOR': '0.020', 'AMMO4': '0.055', 'weapon5': '0.080', 'AMMO3': '0.160', 'HITCOUNT': '0.160', 'WEAPON5': '0.250', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.561', 'WEAPON3': '0.800', 'weapon2': '1.200', 'weapon3': '1.978'} +[2023-09-14 14:49:30,974][63769] DAMAGECOUNT value on done: 5140.0 +[2023-09-14 14:49:30,975][63769] Sum rewards: -4.106, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.000', 'AMMO2': '0.009', 'AMMO5': '0.015', 'AMMO4': '0.043', 'weapon5': '0.098', 'AMMO3': '0.119', 'HITCOUNT': '0.130', 'WEAPON4': '0.150', 'WEAPON5': '0.250', 'weapon4': '0.306', 'DAMAGECOUNT': '0.327', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.224', 'weapon3': '1.622'} +[2023-09-14 14:49:31,392][63769] DAMAGECOUNT value on done: 2795.0 +[2023-09-14 14:49:31,392][63769] Sum rewards: -8.741, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-1.950', 'AMMO5': '0.009', 'AMMO2': '0.010', 'weapon5': '0.030', 'AMMO4': '0.049', 'ARMOR': '0.068', 'WEAPON5': '0.100', 'WEAPON4': '0.150', 'AMMO3': '0.153', 'weapon4': '0.168', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.615', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.170', 'weapon3': '2.016'} +[2023-09-14 14:49:32,311][63733] Updated weights for policy 1, policy_version 1070 (0.0011) +[2023-09-14 14:49:32,461][63454] Saving new best policy, reward=-2.468! +[2023-09-14 14:49:33,091][63769] DAMAGECOUNT value on done: 3643.0 +[2023-09-14 14:49:33,091][63769] Sum rewards: -2.413, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.300', 'AMMO5': '0.017', 'AMMO2': '0.029', 'weapon5': '0.072', 'AMMO3': '0.122', 'HITCOUNT': '0.140', 'AMMO4': '0.145', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'weapon4': '0.316', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.762', 'weapon2': '1.398', 'weapon3': '1.736', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:49:33,427][63769] DAMAGECOUNT value on done: 5089.0 +[2023-09-14 14:49:33,427][63769] Sum rewards: -6.785, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.916', 'AMMO2': '0.006', 'WEAPON1': '0.010', 'AMMO5': '0.018', 'AMMO4': '0.029', 'weapon5': '0.038', 'ARMOR': '0.069', 'AMMO3': '0.158', 'WEAPON4': '0.200', 'weapon4': '0.206', 'HITCOUNT': '0.240', 'WEAPON5': '0.350', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.945', 'WEAPON3': '1.000', 'weapon2': '1.310', 'weapon3': '1.552'} +[2023-09-14 14:49:33,658][63732] Updated weights for policy 0, policy_version 1050 (0.0010) +[2023-09-14 14:49:35,053][63770] DAMAGECOUNT value on done: 5725.0 +[2023-09-14 14:49:35,054][63770] Sum rewards: 1.545, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.931', 'AMMO4': '-0.053', 'AMMO2': '-0.011', 'AMMO5': '0.014', 'weapon7': '0.064', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.141', 'HITCOUNT': '0.160', 'weapon5': '0.182', 'weapon4': '0.192', 'WEAPON5': '0.300', 'ARMOR': '0.467', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.191', 'weapon2': '1.274', 'weapon3': '1.704', 'FRAGCOUNT': '3.500'} +[2023-09-14 14:49:35,402][63770] DAMAGECOUNT value on done: 3149.0 +[2023-09-14 14:49:35,402][63770] Sum rewards: -3.171, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.635', 'AMMO5': '0.003', 'AMMO2': '0.003', 'weapon5': '0.010', 'AMMO4': '0.016', 'WEAPON5': '0.050', 'HITCOUNT': '0.100', 'AMMO3': '0.137', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.850', 'weapon2': '1.308', 'weapon3': '1.922', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:49:37,854][63771] DAMAGECOUNT value on done: 2790.0 +[2023-09-14 14:49:38,252][63771] DAMAGECOUNT value on done: 4707.0 +[2023-09-14 14:49:38,252][63771] Sum rewards: -5.998, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-3.300', 'AMMO4': '-0.029', 'AMMO2': '-0.006', 'AMMO5': '0.005', 'weapon5': '0.008', 'ARMOR': '0.028', 'WEAPON5': '0.100', 'HITCOUNT': '0.180', 'AMMO3': '0.186', 'DAMAGECOUNT': '0.858', 'WEAPON3': '1.050', 'weapon2': '1.470', 'weapon3': '1.702', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:49:39,296][63767] DAMAGECOUNT value on done: 6180.0 +[2023-09-14 14:49:39,297][63767] Sum rewards: 4.534, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-0.495', 'AMMO2': '0.001', 'AMMO4': '0.006', 'AMMO5': '0.007', 'ARMOR': '0.032', 'weapon5': '0.048', 'WEAPON5': '0.100', 'AMMO3': '0.103', 'HITCOUNT': '0.280', 'WEAPON3': '0.350', 'weapon2': '1.168', 'DAMAGECOUNT': '1.317', 'weapon3': '1.616', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:49:39,474][63767] DAMAGECOUNT value on done: 5634.0 +[2023-09-14 14:49:39,474][63767] Sum rewards: -9.964, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.890', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.013', 'AMMO2': '-0.003', 'AMMO5': '0.005', 'weapon5': '0.016', 'WEAPON5': '0.050', 'ARMOR': '0.056', 'AMMO3': '0.170', 'HITCOUNT': '0.240', 'DAMAGECOUNT': '0.777', 'WEAPON3': '1.000', 'weapon2': '1.506', 'weapon3': '1.622'} +[2023-09-14 14:49:39,689][63767] DAMAGECOUNT value on done: 5454.0 +[2023-09-14 14:49:39,690][63767] Sum rewards: -4.481, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.140', 'WEAPON1': '0.010', 'AMMO5': '0.017', 'AMMO2': '0.017', 'ARMOR': '0.028', 'AMMO4': '0.085', 'WEAPON4': '0.100', 'AMMO3': '0.163', 'weapon5': '0.174', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'weapon4': '0.474', 'DAMAGECOUNT': '0.861', 'WEAPON3': '0.900', 'weapon2': '0.938', 'FRAGCOUNT': '1.000', 'weapon3': '1.922'} +[2023-09-14 14:49:39,872][63767] DAMAGECOUNT value on done: 5843.0 +[2023-09-14 14:49:39,872][63767] Sum rewards: 2.237, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.038', 'AMMO4': '-0.016', 'AMMO2': '-0.003', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'weapon4': '0.102', 'AMMO3': '0.138', 'HITCOUNT': '0.370', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.164', 'weapon2': '1.284', 'weapon3': '1.654', 'FRAGCOUNT': '6.000'} +[2023-09-14 14:49:40,238][63732] Updated weights for policy 0, policy_version 1060 (0.0011) +[2023-09-14 14:49:40,329][63735] DAMAGECOUNT value on done: 4668.0 +[2023-09-14 14:49:40,330][63735] Sum rewards: -2.262, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.149', 'AMMO5': '0.003', 'weapon5': '0.016', 'AMMO2': '0.019', 'ARMOR': '0.036', 'WEAPON5': '0.050', 'HITCOUNT': '0.060', 'AMMO4': '0.092', 'AMMO3': '0.104', 'DAMAGECOUNT': '0.135', 'WEAPON4': '0.150', 'weapon4': '0.240', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.306', 'weapon3': '1.576'} +[2023-09-14 14:49:40,697][63733] Updated weights for policy 1, policy_version 1080 (0.0010) +[2023-09-14 14:49:40,706][63735] DAMAGECOUNT value on done: 4518.0 +[2023-09-14 14:49:40,707][63735] Sum rewards: -7.782, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.262', 'FRAGCOUNT': '-1.500', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'AMMO5': '0.007', 'weapon5': '0.072', 'ARMOR': '0.099', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'AMMO3': '0.196', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.330', 'weapon4': '0.432', 'WEAPON3': '0.950', 'weapon3': '1.336', 'weapon2': '1.816'} +[2023-09-14 14:49:43,674][63805] DAMAGECOUNT value on done: 6019.0 +[2023-09-14 14:49:43,674][63805] Sum rewards: -2.050, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.682', 'AMMO5': '0.007', 'AMMO2': '0.017', 'ARMOR': '0.072', 'AMMO4': '0.083', 'WEAPON5': '0.100', 'AMMO3': '0.173', 'HITCOUNT': '0.430', 'WEAPON3': '0.900', 'weapon3': '1.858', 'weapon2': '1.966', 'DAMAGECOUNT': '2.025', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:49:44,020][63805] DAMAGECOUNT value on done: 4020.0 +[2023-09-14 14:49:44,021][63805] Sum rewards: -3.266, reward structure: {'DEATHCOUNT': '-9.000', 'AMMO2': '0.017', 'WEAPON4': '0.050', 'weapon4': '0.080', 'AMMO4': '0.083', 'HEALTH': '0.101', 'ARMOR': '0.106', 'HITCOUNT': '0.130', 'AMMO3': '0.151', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.570', 'FRAGCOUNT': '1.000', 'weapon3': '1.212', 'weapon2': '1.734'} +[2023-09-14 14:49:45,928][63735] DAMAGECOUNT value on done: 4685.0 +[2023-09-14 14:49:45,928][63735] Sum rewards: -7.719, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.922', 'AMMO5': '0.003', 'AMMO2': '0.007', 'weapon5': '0.014', 'AMMO4': '0.034', 'WEAPON5': '0.050', 'ARMOR': '0.056', 'AMMO3': '0.193', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.645', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.100', 'weapon2': '1.820', 'weapon3': '1.822'} +[2023-09-14 14:49:46,334][63735] DAMAGECOUNT value on done: 2978.0 +[2023-09-14 14:49:46,641][63770] DAMAGECOUNT value on done: 4101.0 +[2023-09-14 14:49:46,641][63770] Sum rewards: -5.735, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.420', 'AMMO4': '-0.039', 'AMMO2': '-0.008', 'AMMO5': '0.007', 'weapon5': '0.038', 'WEAPON5': '0.150', 'AMMO3': '0.157', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.765', 'WEAPON3': '0.900', 'weapon2': '1.446', 'weapon3': '1.558', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:49:46,861][63732] Updated weights for policy 0, policy_version 1070 (0.0012) +[2023-09-14 14:49:47,096][63770] DAMAGECOUNT value on done: 3959.0 +[2023-09-14 14:49:47,097][63770] Sum rewards: 0.577, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.423', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.020', 'AMMO4': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.119', 'weapon5': '0.120', 'HITCOUNT': '0.130', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.324', 'weapon4': '0.426', 'ARMOR': '0.480', 'WEAPON3': '0.750', 'weapon2': '1.190', 'weapon3': '1.826', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:49:47,466][63454] Saving new best policy, reward=-2.434! +[2023-09-14 14:49:49,230][63733] Updated weights for policy 1, policy_version 1090 (0.0011) +[2023-09-14 14:49:49,392][63806] DAMAGECOUNT value on done: 4533.0 +[2023-09-14 14:49:49,393][63806] Sum rewards: -5.620, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.504', 'AMMO5': '0.005', 'AMMO2': '0.008', 'AMMO4': '0.040', 'ARMOR': '0.046', 'WEAPON5': '0.100', 'AMMO3': '0.174', 'WEAPON4': '0.200', 'HITCOUNT': '0.290', 'weapon4': '0.482', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.330', 'weapon3': '1.658'} +[2023-09-14 14:49:49,750][63806] DAMAGECOUNT value on done: 4385.0 +[2023-09-14 14:49:49,750][63806] Sum rewards: -1.281, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.800', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'AMMO5': '0.005', 'weapon4': '0.040', 'ARMOR': '0.052', 'weapon5': '0.054', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.151', 'HITCOUNT': '0.230', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.810', 'weapon2': '1.622', 'weapon3': '1.816', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:49:50,569][63806] DAMAGECOUNT value on done: 3991.0 +[2023-09-14 14:49:50,570][63806] Sum rewards: -10.948, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.804', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.010', 'AMMO2': '0.021', 'weapon5': '0.034', 'HITCOUNT': '0.040', 'WEAPON5': '0.100', 'AMMO4': '0.103', 'DAMAGECOUNT': '0.111', 'weapon4': '0.134', 'AMMO3': '0.163', 'WEAPON4': '0.200', 'ARMOR': '0.464', 'WEAPON3': '0.950', 'weapon3': '1.352', 'weapon2': '1.424'} +[2023-09-14 14:49:50,943][63806] DAMAGECOUNT value on done: 5915.0 +[2023-09-14 14:49:50,943][63806] Sum rewards: -1.128, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.274', 'AMMO5': '0.003', 'AMMO2': '0.015', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'weapon5': '0.054', 'weapon7': '0.068', 'AMMO4': '0.073', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.131', 'WEAPON7': '0.200', 'weapon4': '0.214', 'HITCOUNT': '0.310', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.990', 'FRAGCOUNT': '1.000', 'weapon3': '1.360', 'weapon2': '1.988'} +[2023-09-14 14:49:52,730][63734] DAMAGECOUNT value on done: 4345.0 +[2023-09-14 14:49:52,731][63734] Sum rewards: -1.936, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.452', 'AMMO5': '0.009', 'AMMO2': '0.011', 'ARMOR': '0.024', 'weapon7': '0.050', 'AMMO4': '0.054', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon5': '0.132', 'AMMO3': '0.142', 'HITCOUNT': '0.160', 'WEAPON7': '0.200', 'WEAPON5': '0.250', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.116', 'weapon3': '1.534', 'weapon2': '1.894'} +[2023-09-14 14:49:53,115][63734] DAMAGECOUNT value on done: 3602.0 +[2023-09-14 14:49:53,116][63734] Sum rewards: -3.988, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.469', 'AMMO5': '0.012', 'AMMO2': '0.036', 'ARMOR': '0.072', 'weapon5': '0.082', 'WEAPON4': '0.150', 'AMMO3': '0.158', 'weapon4': '0.172', 'AMMO4': '0.179', 'WEAPON5': '0.200', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.696', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.500', 'weapon2': '1.672', 'weapon3': '1.792'} +[2023-09-14 14:49:53,451][63732] Updated weights for policy 0, policy_version 1080 (0.0011) +[2023-09-14 14:49:53,829][63734] DAMAGECOUNT value on done: 5501.0 +[2023-09-14 14:49:53,829][63734] Sum rewards: -1.849, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.790', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.014', 'weapon4': '0.034', 'WEAPON5': '0.050', 'AMMO4': '0.068', 'AMMO3': '0.088', 'WEAPON4': '0.150', 'HITCOUNT': '0.240', 'ARMOR': '0.400', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.472', 'weapon3': '1.612'} +[2023-09-14 14:49:53,929][63805] DAMAGECOUNT value on done: 5314.0 +[2023-09-14 14:49:53,929][63805] Sum rewards: -0.089, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.352', 'AMMO2': '0.001', 'AMMO4': '0.007', 'AMMO5': '0.010', 'ARMOR': '0.064', 'weapon5': '0.130', 'AMMO3': '0.159', 'HITCOUNT': '0.180', 'WEAPON5': '0.200', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.014', 'weapon3': '1.388', 'weapon2': '1.810', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:49:54,272][63734] DAMAGECOUNT value on done: 3567.0 +[2023-09-14 14:49:54,273][63734] Sum rewards: -5.465, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.410', 'weapon7': '0.006', 'AMMO2': '0.010', 'AMMO5': '0.013', 'weapon5': '0.016', 'AMMO4': '0.050', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.124', 'AMMO3': '0.175', 'WEAPON5': '0.200', 'HITCOUNT': '0.270', 'DAMAGECOUNT': '0.819', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.172', 'weapon3': '1.990'} +[2023-09-14 14:49:54,361][63805] DAMAGECOUNT value on done: 5433.0 +[2023-09-14 14:49:54,361][63805] Sum rewards: -4.144, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.416', 'AMMO5': '0.003', 'weapon5': '0.008', 'AMMO2': '0.021', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.102', 'AMMO3': '0.133', 'HITCOUNT': '0.150', 'weapon4': '0.192', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.146', 'weapon3': '1.742'} +[2023-09-14 14:49:54,915][63769] DAMAGECOUNT value on done: 5503.0 +[2023-09-14 14:49:54,915][63769] Sum rewards: -0.099, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.160', 'AMMO2': '0.010', 'AMMO5': '0.013', 'ARMOR': '0.032', 'AMMO4': '0.050', 'weapon5': '0.068', 'WEAPON4': '0.100', 'HITCOUNT': '0.160', 'AMMO3': '0.174', 'weapon4': '0.188', 'WEAPON5': '0.200', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.089', 'weapon3': '1.296', 'weapon2': '2.082', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:49:55,229][63769] DAMAGECOUNT value on done: 3178.0 +[2023-09-14 14:49:55,229][63769] Sum rewards: 1.073, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.950', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'ARMOR': '0.012', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'weapon5': '0.124', 'AMMO3': '0.196', 'WEAPON5': '0.200', 'HITCOUNT': '0.280', 'WEAPON3': '0.950', 'weapon2': '1.102', 'DAMAGECOUNT': '1.149', 'weapon3': '2.258', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:49:55,568][63771] DAMAGECOUNT value on done: 5244.0 +[2023-09-14 14:49:55,569][63771] Sum rewards: 0.717, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.036', 'AMMO4': '-0.032', 'AMMO2': '-0.006', 'AMMO5': '0.005', 'AMMO3': '0.091', 'ARMOR': '0.123', 'HITCOUNT': '0.180', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.768', 'weapon3': '1.748', 'FRAGCOUNT': '2.000', 'weapon2': '2.026'} +[2023-09-14 14:49:55,955][63771] DAMAGECOUNT value on done: 3572.0 +[2023-09-14 14:49:55,955][63771] Sum rewards: -2.285, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.558', 'AMMO2': '0.011', 'ARMOR': '0.036', 'WEAPON4': '0.050', 'AMMO4': '0.056', 'AMMO3': '0.155', 'weapon4': '0.180', 'HITCOUNT': '0.220', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.930', 'weapon2': '1.288', 'weapon3': '1.596', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:49:57,746][63733] Updated weights for policy 1, policy_version 1100 (0.0011) +[2023-09-14 14:49:58,239][63769] DAMAGECOUNT value on done: 3750.0 +[2023-09-14 14:49:58,239][63769] Sum rewards: -5.332, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.410', 'ARMOR': '0.004', 'AMMO5': '0.015', 'AMMO2': '0.022', 'weapon5': '0.050', 'HITCOUNT': '0.080', 'AMMO4': '0.110', 'AMMO3': '0.126', 'weapon4': '0.136', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.321', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.266', 'weapon3': '1.998'} +[2023-09-14 14:49:58,693][63769] DAMAGECOUNT value on done: 5289.0 +[2023-09-14 14:49:58,693][63769] Sum rewards: -0.987, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.122', 'AMMO2': '0.003', 'AMMO4': '0.014', 'AMMO3': '0.101', 'WEAPON4': '0.150', 'HITCOUNT': '0.210', 'weapon4': '0.232', 'ARMOR': '0.521', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.600', 'weapon2': '1.434', 'weapon3': '1.520', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:50:00,012][63732] Updated weights for policy 0, policy_version 1090 (0.0011) +[2023-09-14 14:50:00,514][63770] DAMAGECOUNT value on done: 5920.0 +[2023-09-14 14:50:00,515][63770] Sum rewards: -1.643, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.610', 'AMMO5': '0.015', 'AMMO2': '0.023', 'HITCOUNT': '0.080', 'AMMO4': '0.113', 'AMMO3': '0.130', 'weapon5': '0.158', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'weapon4': '0.416', 'ARMOR': '0.476', 'DAMAGECOUNT': '0.585', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.134', 'weapon3': '1.236'} +[2023-09-14 14:50:00,611][63771] DAMAGECOUNT value on done: 2915.0 +[2023-09-14 14:50:00,611][63771] Sum rewards: 0.142, reward structure: {'DEATHCOUNT': '-5.250', 'weapon5': '0.010', 'AMMO2': '0.010', 'AMMO5': '0.012', 'ARMOR': '0.028', 'WEAPON4': '0.050', 'AMMO4': '0.051', 'AMMO3': '0.054', 'HITCOUNT': '0.120', 'WEAPON5': '0.150', 'weapon4': '0.164', 'HEALTH': '0.303', 'WEAPON3': '0.350', 'DAMAGECOUNT': '0.375', 'weapon3': '0.846', 'FRAGCOUNT': '1.000', 'weapon2': '1.868'} +[2023-09-14 14:50:00,909][63770] DAMAGECOUNT value on done: 3189.0 +[2023-09-14 14:50:00,960][63771] DAMAGECOUNT value on done: 4832.0 +[2023-09-14 14:50:01,809][63767] DAMAGECOUNT value on done: 5674.0 +[2023-09-14 14:50:01,809][63767] Sum rewards: -6.411, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.580', 'FRAGCOUNT': '-1.500', 'AMMO2': '0.000', 'AMMO4': '0.001', 'AMMO5': '0.005', 'weapon5': '0.056', 'HITCOUNT': '0.060', 'weapon4': '0.080', 'AMMO3': '0.091', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.120', 'WEAPON4': '0.150', 'ARMOR': '0.596', 'WEAPON3': '0.600', 'weapon3': '1.354', 'weapon2': '1.706'} +[2023-09-14 14:50:02,199][63767] DAMAGECOUNT value on done: 5998.0 +[2023-09-14 14:50:02,416][63767] DAMAGECOUNT value on done: 6512.0 +[2023-09-14 14:50:02,416][63767] Sum rewards: -6.084, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.962', 'AMMO5': '0.007', 'AMMO2': '0.008', 'ARMOR': '0.028', 'AMMO4': '0.037', 'WEAPON4': '0.050', 'weapon5': '0.072', 'weapon4': '0.096', 'WEAPON5': '0.100', 'AMMO3': '0.147', 'HITCOUNT': '0.160', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.996', 'FRAGCOUNT': '1.000', 'weapon3': '1.654', 'weapon2': '1.722'} +[2023-09-14 14:50:02,811][63767] DAMAGECOUNT value on done: 5935.0 +[2023-09-14 14:50:02,811][63767] Sum rewards: 2.530, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.120', 'AMMO4': '-0.068', 'AMMO2': '-0.013', 'AMMO5': '0.003', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'weapon5': '0.098', 'WEAPON5': '0.100', 'AMMO3': '0.125', 'HITCOUNT': '0.310', 'WEAPON3': '0.700', 'weapon2': '1.292', 'DAMAGECOUNT': '1.443', 'weapon3': '1.866', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:50:02,855][63806] Large shaping reward -2.549 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.3, -100.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 14:50:05,113][63735] DAMAGECOUNT value on done: 4858.0 +[2023-09-14 14:50:05,114][63735] Sum rewards: -4.463, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.503', 'AMMO5': '0.003', 'AMMO2': '0.006', 'WEAPON1': '0.010', 'AMMO4': '0.029', 'ARMOR': '0.048', 'WEAPON5': '0.050', 'AMMO3': '0.093', 'WEAPON4': '0.100', 'weapon4': '0.134', 'HITCOUNT': '0.150', 'DAMAGECOUNT': '0.570', 'WEAPON3': '0.600', 'weapon3': '1.498', 'weapon2': '1.500', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:50:05,528][63735] DAMAGECOUNT value on done: 4690.0 +[2023-09-14 14:50:05,528][63735] Sum rewards: -5.337, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.230', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.015', 'AMMO2': '-0.003', 'AMMO5': '0.005', 'ARMOR': '0.032', 'weapon5': '0.078', 'WEAPON4': '0.100', 'weapon7': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.130', 'AMMO3': '0.140', 'WEAPON5': '0.150', 'weapon4': '0.188', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.516', 'WEAPON3': '0.900', 'weapon2': '0.976', 'weapon3': '1.156'} +[2023-09-14 14:50:06,063][63733] Updated weights for policy 1, policy_version 1110 (0.0011) +[2023-09-14 14:50:06,496][63732] Updated weights for policy 0, policy_version 1100 (0.0010) +[2023-09-14 14:50:07,465][63454] Saving new best policy, reward=-2.430! +[2023-09-14 14:50:08,683][63805] DAMAGECOUNT value on done: 6481.0 +[2023-09-14 14:50:08,684][63805] Sum rewards: 2.327, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.410', 'AMMO2': '0.004', 'AMMO5': '0.007', 'AMMO4': '0.022', 'weapon5': '0.056', 'ARMOR': '0.092', 'WEAPON4': '0.100', 'AMMO3': '0.109', 'WEAPON5': '0.150', 'HITCOUNT': '0.240', 'weapon4': '0.326', 'WEAPON3': '0.550', 'weapon2': '0.856', 'DAMAGECOUNT': '1.386', 'weapon3': '1.588', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:50:09,014][63805] DAMAGECOUNT value on done: 4108.0 +[2023-09-14 14:50:10,720][63735] DAMAGECOUNT value on done: 4896.0 +[2023-09-14 14:50:10,720][63735] Sum rewards: -5.510, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.742', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.021', 'AMMO2': '-0.004', 'WEAPON1': '0.020', 'AMMO5': '0.025', 'ARMOR': '0.060', 'weapon5': '0.062', 'HITCOUNT': '0.170', 'AMMO3': '0.171', 'WEAPON5': '0.450', 'DAMAGECOUNT': '0.633', 'WEAPON3': '0.900', 'weapon3': '1.492', 'weapon2': '1.774'} +[2023-09-14 14:50:11,119][63735] DAMAGECOUNT value on done: 3113.0 +[2023-09-14 14:50:11,120][63735] Sum rewards: -6.159, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.528', 'AMMO2': '0.001', 'AMMO4': '0.005', 'ARMOR': '0.036', 'HITCOUNT': '0.150', 'AMMO3': '0.182', 'DAMAGECOUNT': '0.405', 'WEAPON3': '1.100', 'weapon2': '1.260', 'FRAGCOUNT': '2.000', 'weapon3': '2.230'} +[2023-09-14 14:50:12,068][63770] DAMAGECOUNT value on done: 4239.0 +[2023-09-14 14:50:12,145][63806] DAMAGECOUNT value on done: 4913.0 +[2023-09-14 14:50:12,145][63806] Sum rewards: -3.971, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.884', 'ARMOR': '0.008', 'AMMO5': '0.012', 'AMMO2': '0.014', 'weapon5': '0.042', 'weapon4': '0.048', 'WEAPON4': '0.050', 'AMMO4': '0.071', 'AMMO3': '0.116', 'WEAPON5': '0.250', 'HITCOUNT': '0.310', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.140', 'FRAGCOUNT': '1.500', 'weapon2': '1.580', 'weapon3': '1.872'} +[2023-09-14 14:50:12,462][63454] Saving new best policy, reward=-2.417! +[2023-09-14 14:50:12,468][63770] DAMAGECOUNT value on done: 4360.0 +[2023-09-14 14:50:12,469][63770] Sum rewards: 0.334, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.904', 'AMMO4': '-0.037', 'AMMO2': '-0.007', 'AMMO5': '0.015', 'ARMOR': '0.057', 'weapon5': '0.110', 'AMMO3': '0.131', 'HITCOUNT': '0.190', 'WEAPON5': '0.250', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.203', 'weapon2': '1.698', 'weapon3': '1.778', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:50:12,543][63806] DAMAGECOUNT value on done: 4863.0 +[2023-09-14 14:50:12,543][63806] Sum rewards: -5.032, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.446', 'AMMO5': '0.007', 'AMMO2': '0.011', 'weapon4': '0.044', 'weapon5': '0.048', 'WEAPON4': '0.050', 'AMMO4': '0.054', 'ARMOR': '0.064', 'WEAPON5': '0.150', 'AMMO3': '0.196', 'HITCOUNT': '0.360', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.434', 'FRAGCOUNT': '1.500', 'weapon2': '1.564', 'weapon3': '2.032'} +[2023-09-14 14:50:13,077][63732] Updated weights for policy 0, policy_version 1110 (0.0010) +[2023-09-14 14:50:14,487][63733] Updated weights for policy 1, policy_version 1120 (0.0011) +[2023-09-14 14:50:14,795][63806] DAMAGECOUNT value on done: 4266.0 +[2023-09-14 14:50:14,796][63806] Sum rewards: -7.925, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.758', 'AMMO2': '0.002', 'AMMO4': '0.011', 'weapon7': '0.030', 'ARMOR': '0.040', 'weapon4': '0.042', 'WEAPON4': '0.050', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.147', 'HITCOUNT': '0.220', 'DAMAGECOUNT': '0.825', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.606', 'weapon3': '1.610'} +[2023-09-14 14:50:15,190][63806] DAMAGECOUNT value on done: 6081.0 +[2023-09-14 14:50:15,191][63806] Sum rewards: -4.691, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.176', 'AMMO4': '-0.073', 'AMMO2': '-0.015', 'WEAPON1': '0.010', 'AMMO5': '0.017', 'ARMOR': '0.036', 'weapon5': '0.108', 'HITCOUNT': '0.170', 'AMMO3': '0.172', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.498', 'WEAPON3': '0.550', 'weapon3': '1.420', 'FRAGCOUNT': '2.000', 'weapon2': '2.092'} +[2023-09-14 14:50:16,144][63734] DAMAGECOUNT value on done: 4493.0 +[2023-09-14 14:50:16,541][63734] DAMAGECOUNT value on done: 3746.0 +[2023-09-14 14:50:16,541][63734] Sum rewards: -4.930, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-0.500', 'HEALTH': '-0.440', 'AMMO5': '0.009', 'AMMO2': '0.022', 'weapon5': '0.070', 'ARMOR': '0.072', 'AMMO4': '0.108', 'HITCOUNT': '0.150', 'AMMO3': '0.165', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.432', 'WEAPON3': '0.850', 'weapon2': '1.746', 'weapon3': '1.936'} +[2023-09-14 14:50:18,347][63769] DAMAGECOUNT value on done: 5766.0 +[2023-09-14 14:50:18,347][63769] Sum rewards: -4.454, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.471', 'AMMO2': '0.009', 'AMMO5': '0.011', 'ARMOR': '0.028', 'AMMO4': '0.043', 'weapon5': '0.056', 'WEAPON4': '0.100', 'AMMO3': '0.137', 'WEAPON5': '0.150', 'weapon4': '0.172', 'HITCOUNT': '0.260', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.789', 'FRAGCOUNT': '1.000', 'weapon2': '1.574', 'weapon3': '1.688'} +[2023-09-14 14:50:18,689][63769] DAMAGECOUNT value on done: 3610.0 +[2023-09-14 14:50:18,689][63769] Sum rewards: -3.923, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.398', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'AMMO5': '0.017', 'AMMO3': '0.173', 'weapon5': '0.192', 'HITCOUNT': '0.290', 'WEAPON5': '0.400', 'WEAPON3': '0.700', 'weapon3': '1.164', 'DAMAGECOUNT': '1.296', 'FRAGCOUNT': '1.500', 'weapon2': '2.274'} +[2023-09-14 14:50:18,754][63734] DAMAGECOUNT value on done: 5653.0 +[2023-09-14 14:50:18,755][63734] Sum rewards: -4.154, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '0.000', 'weapon4': '0.028', 'AMMO2': '0.030', 'ARMOR': '0.048', 'weapon7': '0.086', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.110', 'AMMO4': '0.150', 'HITCOUNT': '0.150', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.456', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.452', 'weapon3': '1.736'} +[2023-09-14 14:50:19,097][63805] DAMAGECOUNT value on done: 5762.0 +[2023-09-14 14:50:19,097][63805] Sum rewards: -0.005, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.875', 'AMMO4': '-0.052', 'AMMO2': '-0.010', 'ARMOR': '0.008', 'WEAPON4': '0.050', 'weapon7': '0.088', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.146', 'weapon4': '0.168', 'WEAPON7': '0.200', 'HITCOUNT': '0.300', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.344', 'weapon3': '1.474', 'weapon2': '1.564', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:50:19,145][63734] DAMAGECOUNT value on done: 4052.0 +[2023-09-14 14:50:19,146][63734] Sum rewards: 4.076, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.275', 'AMMO4': '-0.000', 'AMMO2': '0.000', 'WEAPON1': '0.010', 'AMMO5': '0.017', 'ARMOR': '0.032', 'AMMO3': '0.111', 'weapon5': '0.200', 'HITCOUNT': '0.270', 'WEAPON5': '0.300', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.455', 'weapon2': '1.632', 'weapon3': '1.674', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:50:19,458][63805] DAMAGECOUNT value on done: 5488.0 +[2023-09-14 14:50:19,637][63732] Updated weights for policy 0, policy_version 1120 (0.0011) +[2023-09-14 14:50:20,456][63771] DAMAGECOUNT value on done: 5417.0 +[2023-09-14 14:50:20,457][63771] Sum rewards: -3.530, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.025', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.009', 'WEAPON1': '0.030', 'ARMOR': '0.080', 'WEAPON4': '0.100', 'AMMO3': '0.124', 'HITCOUNT': '0.180', 'weapon5': '0.210', 'WEAPON5': '0.250', 'weapon4': '0.270', 'DAMAGECOUNT': '0.519', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.286', 'weapon3': '1.892'} +[2023-09-14 14:50:20,850][63771] DAMAGECOUNT value on done: 3792.0 +[2023-09-14 14:50:20,851][63771] Sum rewards: -6.214, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.988', 'AMMO4': '-0.038', 'AMMO2': '-0.008', 'AMMO5': '0.013', 'ARMOR': '0.020', 'weapon4': '0.032', 'weapon5': '0.064', 'WEAPON4': '0.100', 'AMMO3': '0.101', 'WEAPON5': '0.150', 'HITCOUNT': '0.180', 'DAMAGECOUNT': '0.660', 'WEAPON3': '0.700', 'weapon3': '1.484', 'weapon2': '1.816', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:50:22,533][63806] Large shaping reward -2.504 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.255, -85.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 14:50:22,907][63733] Updated weights for policy 1, policy_version 1130 (0.0010) +[2023-09-14 14:50:23,195][63769] DAMAGECOUNT value on done: 4105.0 +[2023-09-14 14:50:23,195][63769] Sum rewards: -4.053, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.594', 'AMMO5': '0.005', 'AMMO2': '0.013', 'weapon5': '0.024', 'ARMOR': '0.064', 'AMMO4': '0.065', 'WEAPON5': '0.100', 'AMMO3': '0.132', 'HITCOUNT': '0.290', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.065', 'weapon2': '1.438', 'weapon3': '1.996'} +[2023-09-14 14:50:23,422][63771] DAMAGECOUNT value on done: 2999.0 +[2023-09-14 14:50:23,591][63769] DAMAGECOUNT value on done: 5835.0 +[2023-09-14 14:50:23,592][63769] Sum rewards: 1.567, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.270', 'AMMO2': '0.004', 'ARMOR': '0.005', 'AMMO4': '0.022', 'AMMO3': '0.122', 'HITCOUNT': '0.390', 'WEAPON3': '0.650', 'weapon2': '1.540', 'DAMAGECOUNT': '1.638', 'weapon3': '1.716', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:50:23,817][63771] DAMAGECOUNT value on done: 4932.0 +[2023-09-14 14:50:23,817][63771] Sum rewards: -1.359, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.454', 'AMMO5': '0.003', 'AMMO2': '0.009', 'weapon5': '0.022', 'ARMOR': '0.044', 'AMMO4': '0.044', 'WEAPON5': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.077', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon2': '1.470', 'weapon3': '1.516'} +[2023-09-14 14:50:23,968][63767] DAMAGECOUNT value on done: 5931.0 +[2023-09-14 14:50:23,968][63767] Sum rewards: -4.164, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.105', 'AMMO2': '0.007', 'weapon4': '0.010', 'AMMO4': '0.033', 'ARMOR': '0.040', 'WEAPON4': '0.100', 'AMMO3': '0.108', 'HITCOUNT': '0.170', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.771', 'FRAGCOUNT': '1.000', 'weapon3': '1.608', 'weapon2': '1.694'} +[2023-09-14 14:50:24,300][63767] DAMAGECOUNT value on done: 6138.0 +[2023-09-14 14:50:24,301][63767] Sum rewards: -6.098, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.264', 'AMMO2': '0.006', 'AMMO5': '0.012', 'weapon5': '0.018', 'AMMO4': '0.030', 'WEAPON4': '0.050', 'weapon7': '0.050', 'ARMOR': '0.068', 'HITCOUNT': '0.110', 'weapon4': '0.140', 'AMMO3': '0.151', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON7': '0.200', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.338', 'weapon3': '1.702'} +[2023-09-14 14:50:25,303][63767] DAMAGECOUNT value on done: 6988.0 +[2023-09-14 14:50:25,304][63767] Sum rewards: 0.873, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.484', 'AMMO4': '-0.041', 'AMMO2': '-0.008', 'AMMO5': '0.011', 'ARMOR': '0.060', 'AMMO3': '0.155', 'weapon5': '0.158', 'HITCOUNT': '0.290', 'WEAPON5': '0.300', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.428', 'weapon3': '1.754', 'weapon2': '1.800', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:50:25,662][63770] DAMAGECOUNT value on done: 6053.0 +[2023-09-14 14:50:25,711][63767] DAMAGECOUNT value on done: 6497.0 +[2023-09-14 14:50:25,712][63767] Sum rewards: 2.412, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.350', 'AMMO4': '-0.012', 'AMMO2': '-0.002', 'AMMO5': '0.007', 'ARMOR': '0.040', 'weapon7': '0.064', 'weapon5': '0.090', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.121', 'WEAPON5': '0.150', 'weapon4': '0.154', 'WEAPON7': '0.200', 'HITCOUNT': '0.310', 'WEAPON3': '0.750', 'weapon2': '1.500', 'weapon3': '1.614', 'DAMAGECOUNT': '1.686', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:50:26,007][63770] DAMAGECOUNT value on done: 3338.0 +[2023-09-14 14:50:26,007][63770] Sum rewards: -3.488, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.118', 'AMMO4': '-0.004', 'AMMO2': '-0.001', 'WEAPON4': '0.050', 'HITCOUNT': '0.090', 'AMMO3': '0.101', 'DAMAGECOUNT': '0.447', 'ARMOR': '0.504', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.286', 'weapon2': '1.806'} +[2023-09-14 14:50:26,110][63732] Updated weights for policy 0, policy_version 1130 (0.0010) +[2023-09-14 14:50:27,466][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001135_4648960.pth... +[2023-09-14 14:50:27,467][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001132_4636672.pth... +[2023-09-14 14:50:27,521][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000799_3272704.pth +[2023-09-14 14:50:27,524][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000814_3334144.pth +[2023-09-14 14:50:27,529][63454] Saving new best policy, reward=-2.259! +[2023-09-14 14:50:29,926][63735] DAMAGECOUNT value on done: 5108.0 +[2023-09-14 14:50:29,927][63735] Sum rewards: -4.097, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.763', 'AMMO2': '0.021', 'weapon4': '0.054', 'ARMOR': '0.060', 'AMMO4': '0.103', 'AMMO3': '0.116', 'HITCOUNT': '0.150', 'WEAPON4': '0.200', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.750', 'weapon3': '1.516', 'weapon2': '1.596', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:50:30,334][63735] DAMAGECOUNT value on done: 5064.0 +[2023-09-14 14:50:30,334][63735] Sum rewards: 1.088, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.361', 'AMMO4': '-0.028', 'AMMO2': '-0.005', 'AMMO5': '0.008', 'AMMO3': '0.056', 'ARMOR': '0.064', 'weapon5': '0.086', 'weapon7': '0.102', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON7': '0.200', 'WEAPON5': '0.200', 'HITCOUNT': '0.280', 'WEAPON3': '0.450', 'weapon3': '1.104', 'DAMAGECOUNT': '1.122', 'weapon2': '1.570', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:50:31,375][63733] Updated weights for policy 1, policy_version 1140 (0.0010) +[2023-09-14 14:50:32,461][63454] Saving new best policy, reward=-2.208! +[2023-09-14 14:50:32,679][63732] Updated weights for policy 0, policy_version 1140 (0.0010) +[2023-09-14 14:50:33,602][63805] DAMAGECOUNT value on done: 6681.0 +[2023-09-14 14:50:33,603][63805] Sum rewards: -0.317, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.086', 'AMMO2': '0.016', 'AMMO5': '0.022', 'AMMO4': '0.082', 'AMMO3': '0.083', 'HITCOUNT': '0.130', 'WEAPON4': '0.150', 'weapon5': '0.184', 'WEAPON5': '0.350', 'weapon4': '0.402', 'ARMOR': '0.555', 'DAMAGECOUNT': '0.600', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.228', 'weapon3': '1.366'} +[2023-09-14 14:50:34,064][63805] DAMAGECOUNT value on done: 4203.0 +[2023-09-14 14:50:34,065][63805] Sum rewards: -3.477, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.004', 'AMMO4': '-0.043', 'AMMO2': '-0.009', 'AMMO5': '0.007', 'weapon5': '0.026', 'ARMOR': '0.028', 'WEAPON5': '0.050', 'HITCOUNT': '0.100', 'AMMO3': '0.127', 'weapon6': '0.128', 'AMMO6': '0.172', 'AMMO7': '0.172', 'WEAPON6': '0.200', 'DAMAGECOUNT': '0.285', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.388', 'weapon2': '1.744'} +[2023-09-14 14:50:35,115][63806] DAMAGECOUNT value on done: 5375.0 +[2023-09-14 14:50:35,115][63806] Sum rewards: 0.043, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.280', 'WEAPON1': '0.010', 'AMMO5': '0.018', 'AMMO2': '0.018', 'weapon5': '0.020', 'ARMOR': '0.080', 'AMMO4': '0.090', 'AMMO3': '0.123', 'WEAPON4': '0.150', 'weapon4': '0.214', 'WEAPON5': '0.250', 'HITCOUNT': '0.280', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.386', 'weapon3': '1.720', 'weapon2': '1.764'} +[2023-09-14 14:50:35,490][63735] DAMAGECOUNT value on done: 5333.0 +[2023-09-14 14:50:35,491][63735] Sum rewards: -1.875, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.710', 'AMMO4': '-0.076', 'AMMO2': '-0.015', 'AMMO5': '0.007', 'weapon5': '0.074', 'AMMO3': '0.160', 'WEAPON5': '0.200', 'HITCOUNT': '0.330', 'ARMOR': '0.495', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.311', 'weapon2': '1.522', 'weapon3': '1.926', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:50:35,502][63806] DAMAGECOUNT value on done: 5186.0 +[2023-09-14 14:50:35,502][63806] Sum rewards: -6.313, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-3.320', 'AMMO4': '-0.053', 'AMMO2': '-0.011', 'ARMOR': '0.014', 'AMMO5': '0.015', 'weapon5': '0.174', 'AMMO3': '0.196', 'HITCOUNT': '0.200', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.969', 'WEAPON3': '1.200', 'weapon2': '1.542', 'weapon3': '1.710', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:50:35,883][63735] DAMAGECOUNT value on done: 3132.0 +[2023-09-14 14:50:35,884][63735] Sum rewards: -7.193, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.387', 'AMMO2': '0.021', 'HITCOUNT': '0.040', 'DAMAGECOUNT': '0.057', 'ARMOR': '0.064', 'AMMO4': '0.107', 'AMMO3': '0.125', 'WEAPON4': '0.300', 'weapon4': '0.310', 'WEAPON3': '0.550', 'weapon3': '0.892', 'FRAGCOUNT': '1.000', 'weapon2': '1.978'} +[2023-09-14 14:50:37,236][63770] DAMAGECOUNT value on done: 4579.0 +[2023-09-14 14:50:37,236][63770] Sum rewards: 3.938, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.426', 'AMMO2': '0.002', 'AMMO5': '0.005', 'AMMO4': '0.011', 'weapon5': '0.050', 'ARMOR': '0.072', 'WEAPON5': '0.100', 'AMMO3': '0.115', 'HITCOUNT': '0.220', 'WEAPON4': '0.250', 'weapon4': '0.322', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.020', 'weapon2': '1.364', 'weapon3': '1.382', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:50:37,466][63454] Saving new best policy, reward=-2.119! +[2023-09-14 14:50:37,622][63770] DAMAGECOUNT value on done: 4410.0 +[2023-09-14 14:50:39,084][63806] DAMAGECOUNT value on done: 4369.0 +[2023-09-14 14:50:39,084][63806] Sum rewards: -3.943, reward structure: {'DEATHCOUNT': '-6.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.790', 'AMMO4': '-0.033', 'AMMO2': '-0.006', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'weapon5': '0.072', 'AMMO3': '0.090', 'HITCOUNT': '0.090', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.309', 'WEAPON3': '0.650', 'weapon2': '1.462', 'weapon3': '1.546'} +[2023-09-14 14:50:39,300][63732] Updated weights for policy 0, policy_version 1150 (0.0011) +[2023-09-14 14:50:39,492][63806] DAMAGECOUNT value on done: 6255.0 +[2023-09-14 14:50:39,493][63806] Sum rewards: -1.247, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.892', 'AMMO5': '0.005', 'AMMO2': '0.009', 'weapon5': '0.030', 'AMMO4': '0.043', 'ARMOR': '0.084', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.140', 'AMMO3': '0.143', 'weapon4': '0.250', 'DAMAGECOUNT': '0.522', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.594', 'weapon3': '1.626'} +[2023-09-14 14:50:39,747][63733] Updated weights for policy 1, policy_version 1150 (0.0010) +[2023-09-14 14:50:39,926][63734] DAMAGECOUNT value on done: 4658.0 +[2023-09-14 14:50:40,261][63734] DAMAGECOUNT value on done: 4037.0 +[2023-09-14 14:50:40,262][63734] Sum rewards: -1.096, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.518', 'AMMO2': '0.006', 'WEAPON1': '0.010', 'weapon5': '0.012', 'AMMO5': '0.012', 'AMMO4': '0.032', 'WEAPON4': '0.100', 'ARMOR': '0.116', 'WEAPON5': '0.150', 'AMMO3': '0.168', 'weapon4': '0.206', 'HITCOUNT': '0.270', 'DAMAGECOUNT': '0.873', 'WEAPON3': '1.000', 'weapon2': '1.584', 'weapon3': '1.882', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:50:41,850][63769] DAMAGECOUNT value on done: 5973.0 +[2023-09-14 14:50:41,850][63769] Sum rewards: -4.961, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.640', 'AMMO2': '0.002', 'AMMO5': '0.010', 'AMMO4': '0.010', 'weapon7': '0.048', 'ARMOR': '0.056', 'weapon5': '0.084', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.150', 'AMMO3': '0.159', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.621', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.558', 'weapon2': '1.940'} +[2023-09-14 14:50:42,252][63769] DAMAGECOUNT value on done: 3835.0 +[2023-09-14 14:50:42,253][63769] Sum rewards: -7.450, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.240', 'AMMO4': '-0.002', 'AMMO2': '-0.000', 'AMMO5': '0.005', 'ARMOR': '0.024', 'weapon5': '0.042', 'WEAPON5': '0.050', 'HITCOUNT': '0.190', 'AMMO3': '0.210', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon3': '1.466', 'weapon2': '2.230'} +[2023-09-14 14:50:44,079][63734] DAMAGECOUNT value on done: 6048.0 +[2023-09-14 14:50:44,080][63734] Sum rewards: -4.698, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.678', 'AMMO2': '0.008', 'AMMO4': '0.041', 'ARMOR': '0.088', 'WEAPON4': '0.150', 'AMMO3': '0.172', 'HITCOUNT': '0.280', 'weapon4': '0.304', 'WEAPON3': '1.100', 'weapon2': '1.126', 'DAMAGECOUNT': '1.185', 'weapon3': '1.776', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:50:44,092][63805] DAMAGECOUNT value on done: 6316.0 +[2023-09-14 14:50:44,093][63805] Sum rewards: 4.692, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.465', 'AMMO2': '0.005', 'AMMO5': '0.017', 'AMMO4': '0.026', 'ARMOR': '0.060', 'weapon4': '0.068', 'weapon7': '0.070', 'AMMO3': '0.096', 'WEAPON4': '0.100', 'weapon5': '0.112', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.320', 'WEAPON3': '0.550', 'weapon2': '1.544', 'weapon3': '1.636', 'DAMAGECOUNT': '1.662', 'FRAGCOUNT': '6.000'} +[2023-09-14 14:50:44,449][63734] DAMAGECOUNT value on done: 4706.0 +[2023-09-14 14:50:44,450][63734] Sum rewards: 0.500, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.890', 'AMMO4': '-0.039', 'AMMO2': '-0.008', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'AMMO3': '0.149', 'WEAPON5': '0.200', 'weapon5': '0.208', 'HITCOUNT': '0.390', 'WEAPON3': '0.700', 'weapon2': '1.220', 'DAMAGECOUNT': '1.941', 'weapon3': '2.060', 'FRAGCOUNT': '3.500'} +[2023-09-14 14:50:44,472][63805] DAMAGECOUNT value on done: 5643.0 +[2023-09-14 14:50:45,456][63771] DAMAGECOUNT value on done: 5692.0 +[2023-09-14 14:50:45,457][63771] Sum rewards: 3.454, reward structure: {'DEATHCOUNT': '-5.250', 'AMMO5': '0.010', 'AMMO2': '0.019', 'WEAPON1': '0.020', 'weapon7': '0.046', 'AMMO4': '0.094', 'weapon5': '0.098', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.106', 'WEAPON4': '0.150', 'HEALTH': '0.152', 'WEAPON5': '0.200', 'HITCOUNT': '0.240', 'weapon4': '0.502', 'ARMOR': '0.504', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.825', 'weapon2': '1.196', 'weapon3': '1.692', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:50:45,866][63771] DAMAGECOUNT value on done: 3807.0 +[2023-09-14 14:50:46,023][63732] Updated weights for policy 0, policy_version 1160 (0.0010) +[2023-09-14 14:50:46,204][63771] DAMAGECOUNT value on done: 3263.0 +[2023-09-14 14:50:46,204][63771] Sum rewards: -0.519, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.582', 'AMMO2': '0.016', 'ARMOR': '0.056', 'AMMO4': '0.081', 'AMMO3': '0.141', 'WEAPON4': '0.200', 'HITCOUNT': '0.240', 'weapon4': '0.242', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.792', 'weapon3': '1.408', 'weapon2': '1.636', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:50:46,349][63767] DAMAGECOUNT value on done: 6172.0 +[2023-09-14 14:50:46,350][63767] Sum rewards: -3.571, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.057', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'weapon5': '0.034', 'ARMOR': '0.064', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.132', 'AMMO3': '0.133', 'HITCOUNT': '0.230', 'DAMAGECOUNT': '0.723', 'WEAPON3': '0.900', 'weapon2': '1.248', 'weapon3': '1.810', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:50:46,588][63771] DAMAGECOUNT value on done: 5147.0 +[2023-09-14 14:50:46,589][63771] Sum rewards: -4.515, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.130', 'AMMO2': '0.002', 'AMMO5': '0.003', 'AMMO4': '0.011', 'weapon5': '0.026', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'AMMO3': '0.180', 'HITCOUNT': '0.180', 'DAMAGECOUNT': '0.645', 'WEAPON3': '0.800', 'weapon3': '1.112', 'FRAGCOUNT': '2.000', 'weapon2': '2.066'} +[2023-09-14 14:50:46,739][63767] DAMAGECOUNT value on done: 6213.0 +[2023-09-14 14:50:48,384][63733] Updated weights for policy 1, policy_version 1160 (0.0011) +[2023-09-14 14:50:48,443][63769] DAMAGECOUNT value on done: 4265.0 +[2023-09-14 14:50:48,675][63767] DAMAGECOUNT value on done: 7293.0 +[2023-09-14 14:50:48,676][63767] Sum rewards: 1.155, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.044', 'AMMO2': '0.010', 'AMMO5': '0.012', 'ARMOR': '0.026', 'AMMO4': '0.048', 'weapon5': '0.070', 'WEAPON4': '0.100', 'weapon4': '0.100', 'AMMO3': '0.146', 'WEAPON5': '0.250', 'HITCOUNT': '0.260', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.915', 'weapon3': '1.562', 'weapon2': '1.850', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:50:48,842][63769] DAMAGECOUNT value on done: 6055.0 +[2023-09-14 14:50:48,843][63769] Sum rewards: -0.719, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.064', 'AMMO4': '-0.046', 'AMMO2': '-0.009', 'ARMOR': '0.008', 'AMMO3': '0.096', 'HITCOUNT': '0.140', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.660', 'FRAGCOUNT': '1.000', 'weapon3': '1.528', 'weapon2': '1.568'} +[2023-09-14 14:50:49,022][63767] DAMAGECOUNT value on done: 6907.0 +[2023-09-14 14:50:49,022][63767] Sum rewards: -1.736, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.995', 'AMMO5': '0.012', 'AMMO2': '0.013', 'WEAPON1': '0.020', 'weapon4': '0.042', 'AMMO4': '0.067', 'WEAPON4': '0.100', 'weapon5': '0.130', 'AMMO3': '0.192', 'HITCOUNT': '0.230', 'WEAPON5': '0.250', 'ARMOR': '0.432', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.230', 'weapon2': '1.536', 'weapon3': '1.954', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:50:51,292][63770] DAMAGECOUNT value on done: 6291.0 +[2023-09-14 14:50:51,292][63770] Sum rewards: -4.350, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.940', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.018', 'AMMO5': '0.019', 'WEAPON1': '0.030', 'AMMO4': '0.089', 'AMMO3': '0.138', 'weapon5': '0.184', 'HITCOUNT': '0.190', 'WEAPON5': '0.300', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.714', 'weapon2': '1.484', 'weapon3': '1.524'} +[2023-09-14 14:50:51,696][63770] DAMAGECOUNT value on done: 3533.0 +[2023-09-14 14:50:51,696][63770] Sum rewards: -5.572, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.203', 'AMMO4': '-0.016', 'AMMO2': '-0.003', 'AMMO5': '0.003', 'weapon4': '0.012', 'WEAPON4': '0.050', 'ARMOR': '0.060', 'AMMO3': '0.163', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.585', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.592', 'weapon3': '1.766'} +[2023-09-14 14:50:52,462][63576] Saving new best policy, reward=-4.354! +[2023-09-14 14:50:52,835][63732] Updated weights for policy 0, policy_version 1170 (0.0012) +[2023-09-14 14:50:55,246][63735] DAMAGECOUNT value on done: 5423.0 +[2023-09-14 14:50:55,246][63735] Sum rewards: -2.931, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.240', 'AMMO2': '0.009', 'ARMOR': '0.044', 'AMMO4': '0.046', 'AMMO3': '0.120', 'weapon4': '0.164', 'WEAPON4': '0.200', 'HITCOUNT': '0.270', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.945', 'FRAGCOUNT': '1.000', 'weapon2': '1.492', 'weapon3': '1.668'} +[2023-09-14 14:50:55,688][63735] DAMAGECOUNT value on done: 5436.0 +[2023-09-14 14:50:55,689][63735] Sum rewards: -2.599, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.558', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.010', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'ARMOR': '0.040', 'AMMO4': '0.049', 'AMMO3': '0.123', 'HITCOUNT': '0.230', 'WEAPON5': '0.300', 'weapon5': '0.324', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.116', 'weapon3': '1.434', 'weapon2': '1.600'} +[2023-09-14 14:50:57,261][63733] Updated weights for policy 1, policy_version 1170 (0.0012) +[2023-09-14 14:50:58,978][63806] DAMAGECOUNT value on done: 5402.0 +[2023-09-14 14:50:59,083][63805] DAMAGECOUNT value on done: 6971.0 +[2023-09-14 14:50:59,084][63805] Sum rewards: -1.655, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.704', 'AMMO2': '0.007', 'AMMO5': '0.013', 'AMMO4': '0.033', 'weapon7': '0.064', 'ARMOR': '0.088', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.100', 'weapon5': '0.102', 'AMMO3': '0.136', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON7': '0.200', 'HITCOUNT': '0.290', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.870', 'FRAGCOUNT': '1.000', 'weapon2': '1.252', 'weapon3': '1.874'} +[2023-09-14 14:50:59,319][63806] DAMAGECOUNT value on done: 5288.0 +[2023-09-14 14:50:59,320][63806] Sum rewards: -0.461, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.762', 'AMMO2': '0.005', 'AMMO5': '0.005', 'weapon5': '0.016', 'AMMO4': '0.024', 'WEAPON1': '0.030', 'WEAPON5': '0.100', 'AMMO3': '0.117', 'HITCOUNT': '0.140', 'DAMAGECOUNT': '0.306', 'ARMOR': '0.564', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.098', 'weapon3': '1.496'} +[2023-09-14 14:50:59,436][63805] DAMAGECOUNT value on done: 4338.0 +[2023-09-14 14:50:59,437][63805] Sum rewards: -5.589, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.110', 'AMMO2': '0.003', 'AMMO4': '0.014', 'ARMOR': '0.028', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.138', 'AMMO3': '0.159', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.900', 'weapon2': '1.306', 'weapon3': '1.618', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:50:59,596][63732] Updated weights for policy 0, policy_version 1180 (0.0011) +[2023-09-14 14:51:00,702][63735] DAMAGECOUNT value on done: 5398.0 +[2023-09-14 14:51:01,105][63735] DAMAGECOUNT value on done: 3475.0 +[2023-09-14 14:51:01,106][63735] Sum rewards: -1.493, reward structure: {'DEATHCOUNT': '-9.750', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'ARMOR': '0.028', 'weapon5': '0.032', 'weapon4': '0.036', 'WEAPON4': '0.050', 'HEALTH': '0.070', 'AMMO4': '0.086', 'WEAPON5': '0.100', 'AMMO3': '0.122', 'HITCOUNT': '0.250', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.029', 'weapon3': '1.544', 'weapon2': '1.728', 'FRAGCOUNT': '2.500'} +[2023-09-14 14:51:03,070][63770] DAMAGECOUNT value on done: 4704.0 +[2023-09-14 14:51:03,472][63770] DAMAGECOUNT value on done: 4455.0 +[2023-09-14 14:51:03,473][63770] Sum rewards: -9.683, reward structure: {'DEATHCOUNT': '-11.250', 'FRAGCOUNT': '-3.000', 'HEALTH': '-0.188', 'weapon4': '0.002', 'WEAPON1': '0.010', 'AMMO2': '0.013', 'AMMO5': '0.014', 'ARMOR': '0.028', 'HITCOUNT': '0.050', 'AMMO4': '0.062', 'weapon5': '0.096', 'WEAPON4': '0.100', 'AMMO3': '0.119', 'DAMAGECOUNT': '0.135', 'WEAPON5': '0.200', 'WEAPON3': '0.700', 'weapon3': '1.446', 'weapon2': '1.780'} +[2023-09-14 14:51:04,418][63734] DAMAGECOUNT value on done: 4851.0 +[2023-09-14 14:51:04,419][63734] Sum rewards: -6.789, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.880', 'AMMO2': '0.002', 'AMMO4': '0.011', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'WEAPON4': '0.100', 'AMMO3': '0.132', 'weapon4': '0.134', 'weapon5': '0.154', 'HITCOUNT': '0.200', 'WEAPON5': '0.250', 'ARMOR': '0.490', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.579', 'WEAPON3': '0.600', 'weapon2': '1.404', 'weapon3': '1.752'} +[2023-09-14 14:51:04,433][63806] DAMAGECOUNT value on done: 4569.0 +[2023-09-14 14:51:04,434][63806] Sum rewards: -6.874, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.506', 'AMMO5': '0.005', 'AMMO2': '0.008', 'ARMOR': '0.010', 'weapon5': '0.016', 'AMMO4': '0.042', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'weapon4': '0.138', 'HITCOUNT': '0.150', 'AMMO3': '0.159', 'DAMAGECOUNT': '0.600', 'WEAPON3': '1.000', 'weapon2': '1.602', 'weapon3': '1.752', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:51:04,769][63734] DAMAGECOUNT value on done: 4194.0 +[2023-09-14 14:51:04,769][63734] Sum rewards: -7.217, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.452', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.005', 'AMMO5': '0.013', 'AMMO4': '0.025', 'WEAPON1': '0.040', 'WEAPON4': '0.050', 'weapon4': '0.118', 'HITCOUNT': '0.150', 'AMMO3': '0.180', 'weapon5': '0.198', 'WEAPON5': '0.300', 'ARMOR': '0.466', 'DAMAGECOUNT': '0.471', 'WEAPON3': '0.800', 'weapon3': '1.572', 'weapon2': '1.596'} +[2023-09-14 14:51:04,852][63806] DAMAGECOUNT value on done: 6520.0 +[2023-09-14 14:51:04,853][63806] Sum rewards: -3.402, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.786', 'AMMO5': '0.007', 'AMMO2': '0.019', 'WEAPON1': '0.020', 'ARMOR': '0.044', 'WEAPON4': '0.050', 'HITCOUNT': '0.060', 'AMMO4': '0.097', 'WEAPON5': '0.150', 'AMMO3': '0.156', 'weapon4': '0.162', 'weapon5': '0.272', 'DAMAGECOUNT': '0.795', 'WEAPON3': '0.800', 'weapon2': '1.312', 'FRAGCOUNT': '1.500', 'weapon3': '1.690'} +[2023-09-14 14:51:05,672][63733] Updated weights for policy 1, policy_version 1180 (0.0011) +[2023-09-14 14:51:06,148][63732] Updated weights for policy 0, policy_version 1190 (0.0010) +[2023-09-14 14:51:06,152][63769] DAMAGECOUNT value on done: 6293.0 +[2023-09-14 14:51:06,152][63769] Sum rewards: 0.424, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.450', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.020', 'ARMOR': '0.032', 'weapon5': '0.044', 'WEAPON4': '0.050', 'weapon7': '0.080', 'AMMO6': '0.100', 'AMMO7': '0.100', 'HITCOUNT': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.140', 'weapon4': '0.198', 'WEAPON5': '0.400', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.960', 'weapon2': '1.322', 'weapon3': '1.824', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:51:06,492][63769] DAMAGECOUNT value on done: 4266.0 +[2023-09-14 14:51:06,493][63769] Sum rewards: 0.015, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.463', 'AMMO4': '-0.006', 'AMMO2': '-0.001', 'WEAPON4': '0.050', 'ARMOR': '0.076', 'weapon4': '0.106', 'AMMO3': '0.142', 'HITCOUNT': '0.300', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.293', 'weapon2': '1.528', 'weapon3': '1.690', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:51:08,962][63767] DAMAGECOUNT value on done: 6465.0 +[2023-09-14 14:51:08,963][63767] Sum rewards: -1.232, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.330', 'AMMO4': '-0.040', 'AMMO2': '-0.008', 'AMMO5': '0.012', 'weapon5': '0.052', 'AMMO3': '0.099', 'WEAPON5': '0.150', 'HITCOUNT': '0.220', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.879', 'weapon3': '1.138', 'weapon2': '1.796', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:51:09,346][63767] DAMAGECOUNT value on done: 6228.0 +[2023-09-14 14:51:09,521][63805] DAMAGECOUNT value on done: 6500.0 +[2023-09-14 14:51:09,522][63805] Sum rewards: 0.257, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.038', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO2': '0.015', 'weapon7': '0.070', 'AMMO4': '0.073', 'weapon5': '0.076', 'AMMO3': '0.106', 'HITCOUNT': '0.140', 'WEAPON4': '0.250', 'WEAPON5': '0.250', 'AMMO6': '0.320', 'AMMO7': '0.320', 'weapon4': '0.340', 'WEAPON7': '0.400', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.552', 'FRAGCOUNT': '1.000', 'weapon3': '1.272', 'weapon2': '1.588'} +[2023-09-14 14:51:09,687][63771] DAMAGECOUNT value on done: 3413.0 +[2023-09-14 14:51:09,687][63771] Sum rewards: -5.030, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.038', 'AMMO2': '0.016', 'ARMOR': '0.028', 'AMMO4': '0.079', 'AMMO3': '0.131', 'HITCOUNT': '0.140', 'WEAPON4': '0.300', 'weapon4': '0.328', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.850', 'weapon3': '1.396', 'weapon2': '1.790', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:51:09,875][63805] DAMAGECOUNT value on done: 5861.0 +[2023-09-14 14:51:09,876][63805] Sum rewards: -2.412, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.946', 'AMMO5': '0.005', 'weapon5': '0.010', 'AMMO2': '0.016', 'WEAPON5': '0.050', 'AMMO4': '0.081', 'AMMO3': '0.084', 'WEAPON4': '0.100', 'HITCOUNT': '0.200', 'weapon4': '0.308', 'ARMOR': '0.448', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.654', 'weapon3': '1.288', 'weapon2': '1.540', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:51:10,071][63771] DAMAGECOUNT value on done: 5401.0 +[2023-09-14 14:51:10,071][63771] Sum rewards: -3.258, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.025', 'AMMO4': '-0.051', 'AMMO2': '-0.010', 'weapon4': '0.042', 'ARMOR': '0.072', 'AMMO3': '0.096', 'WEAPON4': '0.100', 'HITCOUNT': '0.260', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.762', 'weapon3': '1.296', 'weapon2': '1.850', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:51:10,148][63734] DAMAGECOUNT value on done: 6348.0 +[2023-09-14 14:51:10,149][63734] Sum rewards: -0.885, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.848', 'AMMO2': '0.001', 'AMMO5': '0.003', 'AMMO4': '0.003', 'weapon5': '0.040', 'WEAPON5': '0.050', 'AMMO3': '0.088', 'HITCOUNT': '0.240', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.900', 'weapon3': '1.154', 'weapon2': '1.734', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:51:10,475][63734] DAMAGECOUNT value on done: 4832.0 +[2023-09-14 14:51:10,475][63734] Sum rewards: -8.858, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-3.000', 'HEALTH': '-1.488', 'AMMO4': '-0.020', 'AMMO2': '-0.004', 'AMMO5': '0.017', 'ARMOR': '0.060', 'HITCOUNT': '0.130', 'weapon5': '0.166', 'AMMO3': '0.176', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.378', 'WEAPON3': '1.050', 'weapon2': '1.468', 'weapon3': '1.708'} +[2023-09-14 14:51:11,288][63771] DAMAGECOUNT value on done: 6233.0 +[2023-09-14 14:51:11,288][63771] Sum rewards: -1.610, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.598', 'AMMO4': '-0.029', 'AMMO2': '-0.006', 'AMMO5': '0.009', 'WEAPON1': '0.030', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon7': '0.100', 'AMMO3': '0.127', 'weapon5': '0.176', 'WEAPON5': '0.200', 'HITCOUNT': '0.360', 'WEAPON3': '0.800', 'weapon2': '1.320', 'DAMAGECOUNT': '1.623', 'weapon3': '1.728', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:51:11,753][63771] DAMAGECOUNT value on done: 4342.0 +[2023-09-14 14:51:11,753][63771] Sum rewards: -1.453, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.654', 'AMMO5': '0.005', 'AMMO2': '0.009', 'WEAPON1': '0.020', 'AMMO4': '0.045', 'WEAPON5': '0.050', 'AMMO3': '0.127', 'HITCOUNT': '0.380', 'WEAPON3': '0.750', 'weapon3': '1.446', 'weapon2': '1.514', 'DAMAGECOUNT': '1.605', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:51:11,995][63767] DAMAGECOUNT value on done: 7426.0 +[2023-09-14 14:51:11,995][63767] Sum rewards: -4.387, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.690', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.007', 'weapon5': '0.008', 'AMMO2': '0.011', 'AMMO4': '0.054', 'AMMO3': '0.110', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'weapon4': '0.340', 'DAMAGECOUNT': '0.399', 'WEAPON3': '0.650', 'weapon3': '1.200', 'weapon2': '1.834'} +[2023-09-14 14:51:12,388][63767] DAMAGECOUNT value on done: 7120.0 +[2023-09-14 14:51:12,388][63767] Sum rewards: -4.365, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.280', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'AMMO5': '0.017', 'ARMOR': '0.040', 'WEAPON1': '0.040', 'weapon5': '0.080', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON4': '0.100', 'weapon7': '0.128', 'AMMO3': '0.157', 'HITCOUNT': '0.160', 'weapon4': '0.326', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.639', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon3': '1.124', 'weapon2': '1.564'} +[2023-09-14 14:51:12,462][63576] Saving new best policy, reward=-4.307! +[2023-09-14 14:51:12,806][63732] Updated weights for policy 0, policy_version 1200 (0.0012) +[2023-09-14 14:51:14,298][63769] DAMAGECOUNT value on done: 4369.0 +[2023-09-14 14:51:14,298][63769] Sum rewards: -2.275, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.842', 'AMMO5': '0.007', 'weapon7': '0.012', 'AMMO2': '0.016', 'WEAPON1': '0.030', 'weapon5': '0.076', 'AMMO4': '0.078', 'ARMOR': '0.080', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.145', 'WEAPON5': '0.150', 'weapon4': '0.178', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'DAMAGECOUNT': '0.312', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.260', 'weapon2': '1.962'} +[2023-09-14 14:51:14,305][63733] Updated weights for policy 1, policy_version 1190 (0.0012) +[2023-09-14 14:51:14,636][63769] DAMAGECOUNT value on done: 6170.0 +[2023-09-14 14:51:14,636][63769] Sum rewards: -5.294, reward structure: {'DEATHCOUNT': '-11.250', 'AMMO2': '0.008', 'AMMO4': '0.041', 'WEAPON4': '0.050', 'HITCOUNT': '0.080', 'HEALTH': '0.138', 'AMMO3': '0.158', 'DAMAGECOUNT': '0.345', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.624', 'weapon2': '1.762'} +[2023-09-14 14:51:17,059][63770] DAMAGECOUNT value on done: 6541.0 +[2023-09-14 14:51:17,060][63770] Sum rewards: -2.261, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.729', 'AMMO5': '0.013', 'AMMO2': '0.015', 'ARMOR': '0.028', 'weapon5': '0.038', 'AMMO4': '0.074', 'weapon7': '0.092', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.105', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.380', 'weapon2': '1.954'} +[2023-09-14 14:51:17,464][63770] DAMAGECOUNT value on done: 3838.0 +[2023-09-14 14:51:17,465][63770] Sum rewards: -2.496, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.030', 'weapon5': '0.004', 'ARMOR': '0.004', 'AMMO2': '0.004', 'AMMO5': '0.013', 'AMMO4': '0.022', 'weapon4': '0.082', 'WEAPON4': '0.100', 'AMMO3': '0.116', 'WEAPON5': '0.250', 'HITCOUNT': '0.260', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.915', 'weapon2': '1.336', 'weapon3': '1.778', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:51:19,569][63732] Updated weights for policy 0, policy_version 1210 (0.0010) +[2023-09-14 14:51:20,250][63735] DAMAGECOUNT value on done: 5528.0 +[2023-09-14 14:51:20,251][63735] Sum rewards: -4.315, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.753', 'AMMO2': '0.007', 'AMMO4': '0.035', 'WEAPON4': '0.050', 'weapon4': '0.060', 'HITCOUNT': '0.080', 'AMMO3': '0.161', 'DAMAGECOUNT': '0.315', 'ARMOR': '0.472', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.288', 'weapon3': '2.020'} +[2023-09-14 14:51:20,565][63735] DAMAGECOUNT value on done: 5573.0 +[2023-09-14 14:51:20,565][63735] Sum rewards: -3.093, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.706', 'AMMO2': '0.005', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.026', 'WEAPON4': '0.050', 'weapon5': '0.054', 'AMMO3': '0.121', 'HITCOUNT': '0.160', 'weapon4': '0.160', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.411', 'WEAPON3': '0.600', 'ARMOR': '0.851', 'weapon2': '1.416', 'weapon3': '1.774'} +[2023-09-14 14:51:22,236][63806] DAMAGECOUNT value on done: 5586.0 +[2023-09-14 14:51:22,237][63806] Sum rewards: -7.161, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.528', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO2': '0.023', 'weapon5': '0.034', 'AMMO4': '0.112', 'weapon4': '0.126', 'HITCOUNT': '0.170', 'AMMO3': '0.182', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'ARMOR': '0.412', 'DAMAGECOUNT': '0.552', 'WEAPON3': '1.000', 'weapon2': '1.290', 'weapon3': '1.734'} +[2023-09-14 14:51:22,462][63576] Saving new best policy, reward=-4.299! +[2023-09-14 14:51:22,558][63806] DAMAGECOUNT value on done: 5456.0 +[2023-09-14 14:51:22,558][63806] Sum rewards: -1.461, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.410', 'AMMO5': '0.012', 'AMMO2': '0.014', 'WEAPON4': '0.050', 'ARMOR': '0.064', 'AMMO4': '0.069', 'AMMO3': '0.121', 'HITCOUNT': '0.170', 'weapon4': '0.186', 'weapon5': '0.224', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.504', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.264', 'weapon3': '1.820'} +[2023-09-14 14:51:22,777][63733] Updated weights for policy 1, policy_version 1200 (0.0010) +[2023-09-14 14:51:24,141][63805] DAMAGECOUNT value on done: 7265.0 +[2023-09-14 14:51:24,141][63805] Sum rewards: -2.931, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.008', 'AMMO5': '0.012', 'HEALTH': '0.018', 'ARMOR': '0.028', 'AMMO4': '0.038', 'weapon5': '0.108', 'AMMO3': '0.142', 'WEAPON5': '0.150', 'HITCOUNT': '0.250', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.882', 'weapon2': '1.346', 'weapon3': '2.136'} +[2023-09-14 14:51:24,546][63805] DAMAGECOUNT value on done: 4387.0 +[2023-09-14 14:51:25,692][63735] DAMAGECOUNT value on done: 5912.0 +[2023-09-14 14:51:25,692][63735] Sum rewards: -4.367, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-3.060', 'AMMO2': '0.002', 'AMMO4': '0.010', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'AMMO3': '0.135', 'weapon4': '0.180', 'HITCOUNT': '0.200', 'weapon5': '0.238', 'WEAPON5': '0.300', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.113', 'weapon2': '1.258', 'FRAGCOUNT': '1.500', 'weapon3': '1.768'} +[2023-09-14 14:51:26,031][63732] Updated weights for policy 0, policy_version 1220 (0.0012) +[2023-09-14 14:51:26,091][63735] DAMAGECOUNT value on done: 3641.0 +[2023-09-14 14:51:26,091][63735] Sum rewards: -1.231, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.110', 'AMMO4': '-0.072', 'AMMO2': '-0.014', 'AMMO5': '0.012', 'weapon5': '0.060', 'AMMO3': '0.092', 'HITCOUNT': '0.100', 'WEAPON5': '0.150', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.498', 'weapon3': '1.098', 'weapon2': '1.504', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:51:27,468][63576] Saving new best policy, reward=-4.296! +[2023-09-14 14:51:28,209][63734] DAMAGECOUNT value on done: 5131.0 +[2023-09-14 14:51:28,210][63734] Sum rewards: -4.008, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.270', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'weapon5': '0.026', 'ARMOR': '0.028', 'WEAPON4': '0.050', 'AMMO4': '0.083', 'WEAPON5': '0.100', 'AMMO3': '0.109', 'weapon4': '0.194', 'HITCOUNT': '0.270', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.840', 'weapon2': '1.356', 'weapon3': '1.822'} +[2023-09-14 14:51:28,571][63734] DAMAGECOUNT value on done: 4414.0 +[2023-09-14 14:51:28,572][63734] Sum rewards: -4.895, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.712', 'AMMO2': '0.019', 'WEAPON1': '0.020', 'AMMO4': '0.092', 'AMMO3': '0.154', 'HITCOUNT': '0.200', 'WEAPON4': '0.300', 'ARMOR': '0.480', 'weapon4': '0.654', 'DAMAGECOUNT': '0.660', 'WEAPON3': '0.850', 'weapon2': '1.408', 'weapon3': '1.480', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:51:28,766][63770] DAMAGECOUNT value on done: 4808.0 +[2023-09-14 14:51:29,110][63770] DAMAGECOUNT value on done: 4814.0 +[2023-09-14 14:51:29,110][63770] Sum rewards: -1.928, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.320', 'AMMO5': '0.016', 'AMMO2': '0.017', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'AMMO4': '0.087', 'weapon4': '0.088', 'AMMO3': '0.157', 'HITCOUNT': '0.180', 'weapon5': '0.282', 'WEAPON5': '0.300', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.077', 'weapon3': '1.290', 'weapon2': '1.778', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:51:29,237][63806] DAMAGECOUNT value on done: 4598.0 +[2023-09-14 14:51:29,679][63806] DAMAGECOUNT value on done: 6774.0 +[2023-09-14 14:51:29,679][63806] Sum rewards: -1.113, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.345', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.003', 'ARMOR': '0.068', 'weapon7': '0.074', 'AMMO3': '0.077', 'weapon5': '0.090', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.110', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.160', 'WEAPON7': '0.200', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.762', 'FRAGCOUNT': '1.000', 'weapon3': '1.036', 'weapon2': '1.658'} +[2023-09-14 14:51:30,149][63769] DAMAGECOUNT value on done: 6398.0 +[2023-09-14 14:51:30,149][63769] Sum rewards: -10.214, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.666', 'FRAGCOUNT': '-1.500', 'AMMO2': '0.009', 'weapon4': '0.014', 'AMMO5': '0.023', 'ARMOR': '0.028', 'AMMO4': '0.044', 'WEAPON4': '0.100', 'weapon5': '0.134', 'HITCOUNT': '0.140', 'AMMO3': '0.223', 'DAMAGECOUNT': '0.315', 'WEAPON5': '0.350', 'WEAPON3': '1.150', 'weapon2': '1.266', 'weapon3': '2.156'} +[2023-09-14 14:51:30,513][63769] DAMAGECOUNT value on done: 4374.0 +[2023-09-14 14:51:30,513][63769] Sum rewards: -3.977, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-1.500', 'AMMO2': '0.007', 'WEAPON1': '0.010', 'ARMOR': '0.016', 'AMMO5': '0.016', 'AMMO4': '0.035', 'WEAPON4': '0.050', 'weapon5': '0.076', 'AMMO3': '0.110', 'HITCOUNT': '0.120', 'weapon4': '0.148', 'HEALTH': '0.174', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.324', 'WEAPON3': '0.450', 'weapon2': '1.438', 'weapon3': '1.798'} +[2023-09-14 14:51:31,225][63733] Updated weights for policy 1, policy_version 1210 (0.0011) +[2023-09-14 14:51:31,593][63767] DAMAGECOUNT value on done: 6590.0 +[2023-09-14 14:51:31,594][63767] Sum rewards: -2.416, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.695', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.001', 'AMMO5': '0.003', 'AMMO4': '0.005', 'WEAPON1': '0.030', 'WEAPON5': '0.050', 'weapon5': '0.060', 'AMMO3': '0.110', 'HITCOUNT': '0.140', 'DAMAGECOUNT': '0.375', 'ARMOR': '0.447', 'WEAPON3': '0.500', 'weapon2': '1.498', 'weapon3': '1.560'} +[2023-09-14 14:51:31,943][63767] DAMAGECOUNT value on done: 6403.0 +[2023-09-14 14:51:31,944][63767] Sum rewards: -5.558, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.955', 'AMMO2': '0.003', 'AMMO5': '0.008', 'WEAPON1': '0.010', 'AMMO4': '0.013', 'weapon5': '0.016', 'ARMOR': '0.020', 'AMMO3': '0.096', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.160', 'weapon4': '0.206', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.525', 'weapon3': '1.378', 'weapon2': '1.512'} +[2023-09-14 14:51:32,460][63771] DAMAGECOUNT value on done: 3470.0 +[2023-09-14 14:51:32,460][63771] Sum rewards: -4.938, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.316', 'AMMO4': '-0.033', 'AMMO2': '-0.007', 'AMMO5': '0.005', 'weapon5': '0.008', 'ARMOR': '0.024', 'HITCOUNT': '0.060', 'WEAPON5': '0.100', 'AMMO3': '0.133', 'DAMAGECOUNT': '0.171', 'weapon2': '0.766', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '2.400'} +[2023-09-14 14:51:32,462][63576] Saving new best policy, reward=-4.221! +[2023-09-14 14:51:32,725][63732] Updated weights for policy 0, policy_version 1230 (0.0011) +[2023-09-14 14:51:32,771][63771] DAMAGECOUNT value on done: 5621.0 +[2023-09-14 14:51:32,772][63771] Sum rewards: -4.839, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.130', 'AMMO5': '0.003', 'AMMO2': '0.025', 'ARMOR': '0.044', 'WEAPON5': '0.050', 'weapon4': '0.084', 'weapon5': '0.086', 'WEAPON4': '0.100', 'AMMO4': '0.123', 'AMMO3': '0.128', 'HITCOUNT': '0.200', 'DAMAGECOUNT': '0.660', 'WEAPON3': '0.900', 'weapon2': '1.524', 'weapon3': '1.864', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:51:34,660][63805] DAMAGECOUNT value on done: 6787.0 +[2023-09-14 14:51:34,661][63805] Sum rewards: 2.588, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.062', 'AMMO4': '-0.012', 'AMMO2': '-0.002', 'weapon7': '0.002', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO3': '0.073', 'weapon5': '0.122', 'HITCOUNT': '0.190', 'WEAPON4': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.300', 'WEAPON3': '0.350', 'weapon4': '0.442', 'ARMOR': '0.519', 'DAMAGECOUNT': '0.861', 'weapon3': '1.058', 'weapon2': '1.662', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:51:34,999][63805] DAMAGECOUNT value on done: 5951.0 +[2023-09-14 14:51:34,999][63805] Sum rewards: -4.068, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.448', 'AMMO5': '0.005', 'AMMO2': '0.015', 'WEAPON4': '0.050', 'AMMO4': '0.073', 'HITCOUNT': '0.080', 'weapon4': '0.104', 'AMMO3': '0.135', 'DAMAGECOUNT': '0.270', 'ARMOR': '0.472', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.488', 'weapon2': '1.738'} +[2023-09-14 14:51:35,424][63734] DAMAGECOUNT value on done: 6403.0 +[2023-09-14 14:51:35,425][63734] Sum rewards: -4.329, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.240', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'weapon5': '0.048', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.056', 'HITCOUNT': '0.060', 'ARMOR': '0.062', 'AMMO3': '0.126', 'weapon4': '0.142', 'DAMAGECOUNT': '0.165', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.700', 'weapon3': '1.428', 'weapon2': '1.500'} +[2023-09-14 14:51:35,456][63767] DAMAGECOUNT value on done: 7616.0 +[2023-09-14 14:51:35,456][63767] Sum rewards: -1.256, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.774', 'AMMO4': '-0.060', 'AMMO2': '-0.012', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'ARMOR': '0.020', 'AMMO3': '0.105', 'HITCOUNT': '0.180', 'weapon5': '0.224', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.570', 'WEAPON3': '0.700', 'weapon2': '1.316', 'weapon3': '1.954', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:51:35,816][63767] DAMAGECOUNT value on done: 7460.0 +[2023-09-14 14:51:35,817][63767] Sum rewards: -2.475, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.332', 'FRAGCOUNT': '0.000', 'AMMO2': '0.003', 'AMMO5': '0.009', 'AMMO4': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.040', 'weapon5': '0.048', 'AMMO3': '0.166', 'WEAPON5': '0.200', 'HITCOUNT': '0.240', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.020', 'weapon2': '1.392', 'weapon3': '1.604'} +[2023-09-14 14:51:35,836][63734] DAMAGECOUNT value on done: 5326.0 +[2023-09-14 14:51:35,837][63734] Sum rewards: 1.929, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.116', 'AMMO4': '-0.055', 'AMMO2': '-0.011', 'AMMO5': '0.007', 'WEAPON1': '0.030', 'AMMO3': '0.143', 'WEAPON5': '0.150', 'weapon5': '0.156', 'HITCOUNT': '0.190', 'ARMOR': '0.484', 'WEAPON3': '0.600', 'weapon2': '1.064', 'DAMAGECOUNT': '1.482', 'weapon3': '1.804', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:51:36,455][63771] DAMAGECOUNT value on done: 6728.0 +[2023-09-14 14:51:36,456][63771] Sum rewards: -5.587, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.832', 'AMMO2': '0.002', 'AMMO4': '0.008', 'ARMOR': '0.020', 'AMMO5': '0.023', 'weapon5': '0.050', 'AMMO3': '0.174', 'WEAPON5': '0.200', 'HITCOUNT': '0.360', 'WEAPON3': '0.900', 'weapon2': '1.328', 'DAMAGECOUNT': '1.485', 'FRAGCOUNT': '1.500', 'weapon3': '2.196'} +[2023-09-14 14:51:36,852][63771] DAMAGECOUNT value on done: 4565.0 +[2023-09-14 14:51:36,853][63771] Sum rewards: -5.582, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.318', 'AMMO2': '0.007', 'AMMO4': '0.033', 'ARMOR': '0.096', 'AMMO3': '0.139', 'HITCOUNT': '0.200', 'DAMAGECOUNT': '0.669', 'WEAPON3': '0.750', 'weapon2': '1.412', 'weapon3': '1.680', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:51:39,297][63732] Updated weights for policy 0, policy_version 1240 (0.0010) +[2023-09-14 14:51:39,521][63769] DAMAGECOUNT value on done: 4718.0 +[2023-09-14 14:51:39,521][63769] Sum rewards: -1.361, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.020', 'AMMO2': '0.008', 'AMMO4': '0.038', 'ARMOR': '0.048', 'WEAPON4': '0.100', 'AMMO3': '0.124', 'weapon4': '0.140', 'HITCOUNT': '0.290', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.047', 'weapon3': '1.596', 'weapon2': '1.768', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:51:39,742][63733] Updated weights for policy 1, policy_version 1220 (0.0010) +[2023-09-14 14:51:39,940][63769] DAMAGECOUNT value on done: 6409.0 +[2023-09-14 14:51:39,941][63769] Sum rewards: -2.478, reward structure: {'DEATHCOUNT': '-10.500', 'AMMO5': '0.003', 'weapon5': '0.014', 'AMMO2': '0.024', 'WEAPON5': '0.050', 'HEALTH': '0.054', 'ARMOR': '0.112', 'AMMO4': '0.118', 'AMMO3': '0.134', 'HITCOUNT': '0.260', 'WEAPON4': '0.300', 'weapon4': '0.304', 'DAMAGECOUNT': '0.717', 'WEAPON3': '0.800', 'weapon2': '1.286', 'weapon3': '1.846', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:51:42,703][63770] DAMAGECOUNT value on done: 6855.0 +[2023-09-14 14:51:43,123][63770] DAMAGECOUNT value on done: 4003.0 +[2023-09-14 14:51:43,123][63770] Sum rewards: -4.399, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.298', 'AMMO2': '0.001', 'AMMO4': '0.005', 'weapon5': '0.012', 'AMMO5': '0.017', 'AMMO3': '0.082', 'HITCOUNT': '0.110', 'WEAPON5': '0.250', 'ARMOR': '0.400', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.330', 'weapon2': '1.696'} +[2023-09-14 14:51:44,995][63735] DAMAGECOUNT value on done: 5627.0 +[2023-09-14 14:51:45,371][63735] DAMAGECOUNT value on done: 5801.0 +[2023-09-14 14:51:45,371][63735] Sum rewards: -6.165, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.701', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.010', 'AMMO5': '0.029', 'AMMO4': '0.048', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'AMMO3': '0.116', 'weapon5': '0.134', 'weapon4': '0.242', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.684', 'WEAPON3': '0.750', 'ARMOR': '0.949', 'weapon2': '1.236', 'weapon3': '1.748'} +[2023-09-14 14:51:45,380][63806] DAMAGECOUNT value on done: 5895.0 +[2023-09-14 14:51:45,381][63806] Sum rewards: -2.325, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.212', 'AMMO2': '0.002', 'AMMO4': '0.007', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'AMMO5': '0.028', 'weapon5': '0.090', 'AMMO3': '0.138', 'HITCOUNT': '0.270', 'WEAPON5': '0.450', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.927', 'weapon2': '1.530', 'weapon3': '1.652', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:51:45,734][63806] DAMAGECOUNT value on done: 5782.0 +[2023-09-14 14:51:45,734][63806] Sum rewards: -1.147, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.660', 'AMMO2': '0.012', 'weapon4': '0.016', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'AMMO4': '0.061', 'AMMO3': '0.099', 'WEAPON4': '0.100', 'HITCOUNT': '0.190', 'WEAPON5': '0.400', 'weapon5': '0.438', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.978', 'weapon3': '1.278', 'weapon2': '1.722', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:51:45,991][63732] Updated weights for policy 0, policy_version 1250 (0.0011) +[2023-09-14 14:51:48,128][63733] Updated weights for policy 1, policy_version 1230 (0.0010) +[2023-09-14 14:51:48,887][63769] Large shaping reward -2.504 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.255, -85.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 14:51:49,210][63805] DAMAGECOUNT value on done: 7518.0 +[2023-09-14 14:51:49,567][63805] DAMAGECOUNT value on done: 4510.0 +[2023-09-14 14:51:49,568][63805] Sum rewards: -4.132, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.396', 'AMMO2': '0.001', 'AMMO4': '0.002', 'AMMO5': '0.005', 'ARMOR': '0.020', 'weapon5': '0.020', 'WEAPON5': '0.100', 'HITCOUNT': '0.120', 'AMMO3': '0.143', 'WEAPON4': '0.200', 'weapon4': '0.230', 'DAMAGECOUNT': '0.369', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.346', 'weapon2': '1.358'} +[2023-09-14 14:51:50,447][63735] DAMAGECOUNT value on done: 6217.0 +[2023-09-14 14:51:50,448][63735] Sum rewards: -0.246, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.996', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.012', 'AMMO2': '0.026', 'AMMO4': '0.128', 'AMMO3': '0.133', 'weapon5': '0.176', 'WEAPON5': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon4': '0.270', 'HITCOUNT': '0.290', 'WEAPON4': '0.300', 'ARMOR': '0.492', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.915', 'weapon2': '1.126', 'weapon3': '1.832'} +[2023-09-14 14:51:50,863][63735] DAMAGECOUNT value on done: 3851.0 +[2023-09-14 14:51:50,864][63735] Sum rewards: -3.702, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.578', 'AMMO5': '0.003', 'weapon5': '0.006', 'AMMO2': '0.011', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'WEAPON5': '0.050', 'AMMO4': '0.052', 'HITCOUNT': '0.140', 'AMMO3': '0.158', 'WEAPON4': '0.200', 'weapon4': '0.246', 'DAMAGECOUNT': '0.630', 'WEAPON3': '0.850', 'weapon3': '1.520', 'weapon2': '1.704', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:51:52,123][63734] DAMAGECOUNT value on done: 5480.0 +[2023-09-14 14:51:52,123][63734] Sum rewards: 0.223, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.351', 'AMMO2': '0.008', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.040', 'weapon5': '0.060', 'ARMOR': '0.064', 'AMMO3': '0.194', 'WEAPON5': '0.200', 'HITCOUNT': '0.290', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.047', 'weapon2': '1.558', 'weapon3': '1.980', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:51:52,482][63732] Updated weights for policy 0, policy_version 1260 (0.0011) +[2023-09-14 14:51:52,517][63734] DAMAGECOUNT value on done: 4539.0 +[2023-09-14 14:51:52,518][63734] Sum rewards: -5.045, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.908', 'AMMO5': '0.012', 'AMMO2': '0.023', 'ARMOR': '0.048', 'weapon5': '0.062', 'HITCOUNT': '0.080', 'WEAPON4': '0.100', 'AMMO4': '0.115', 'weapon4': '0.128', 'AMMO3': '0.162', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.375', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050', 'weapon2': '1.102', 'weapon3': '2.106'} +[2023-09-14 14:51:53,699][63806] DAMAGECOUNT value on done: 4683.0 +[2023-09-14 14:51:53,780][63769] DAMAGECOUNT value on done: 6603.0 +[2023-09-14 14:51:53,781][63769] Sum rewards: -0.750, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.768', 'AMMO2': '0.001', 'AMMO4': '0.002', 'AMMO5': '0.018', 'weapon7': '0.028', 'ARMOR': '0.032', 'AMMO3': '0.099', 'WEAPON4': '0.100', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'weapon5': '0.132', 'HITCOUNT': '0.150', 'weapon4': '0.206', 'WEAPON5': '0.300', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.615', 'weapon3': '1.402', 'weapon2': '1.532'} +[2023-09-14 14:51:53,785][63770] Large shaping reward -2.549 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.3, -100.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 14:51:54,064][63806] DAMAGECOUNT value on done: 7000.0 +[2023-09-14 14:51:54,065][63806] Sum rewards: -3.537, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.032', 'AMMO2': '0.009', 'WEAPON1': '0.010', 'AMMO5': '0.022', 'AMMO4': '0.044', 'weapon5': '0.114', 'AMMO3': '0.128', 'HITCOUNT': '0.160', 'WEAPON4': '0.350', 'WEAPON5': '0.350', 'ARMOR': '0.512', 'weapon4': '0.524', 'DAMAGECOUNT': '0.678', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.416', 'weapon3': '1.478'} +[2023-09-14 14:51:54,110][63769] DAMAGECOUNT value on done: 4699.0 +[2023-09-14 14:51:54,111][63769] Sum rewards: -0.150, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO5': '0.010', 'HEALTH': '0.016', 'AMMO2': '0.020', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'weapon7': '0.074', 'AMMO4': '0.099', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.116', 'WEAPON5': '0.150', 'weapon4': '0.150', 'HITCOUNT': '0.160', 'weapon5': '0.160', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.975', 'weapon3': '1.412', 'FRAGCOUNT': '1.500', 'weapon2': '1.568'} +[2023-09-14 14:51:54,119][63767] DAMAGECOUNT value on done: 6715.0 +[2023-09-14 14:51:54,119][63767] Sum rewards: -3.646, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.670', 'AMMO5': '0.007', 'weapon5': '0.008', 'AMMO2': '0.010', 'WEAPON1': '0.020', 'ARMOR': '0.035', 'AMMO4': '0.052', 'AMMO3': '0.104', 'HITCOUNT': '0.110', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'weapon4': '0.284', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.586', 'weapon2': '1.632'} +[2023-09-14 14:51:54,155][63770] DAMAGECOUNT value on done: 5055.0 +[2023-09-14 14:51:54,155][63770] Sum rewards: -4.760, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.844', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.011', 'AMMO5': '0.012', 'weapon5': '0.032', 'WEAPON4': '0.050', 'AMMO4': '0.056', 'AMMO3': '0.110', 'HITCOUNT': '0.150', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.741', 'WEAPON3': '0.750', 'weapon2': '1.666', 'weapon3': '1.756'} +[2023-09-14 14:51:54,464][63767] DAMAGECOUNT value on done: 6575.0 +[2023-09-14 14:51:54,464][63767] Sum rewards: -5.443, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.912', 'AMMO2': '0.008', 'AMMO5': '0.010', 'AMMO4': '0.038', 'weapon5': '0.064', 'ARMOR': '0.068', 'AMMO3': '0.119', 'weapon4': '0.126', 'WEAPON4': '0.150', 'HITCOUNT': '0.170', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.516', 'WEAPON3': '0.850', 'weapon2': '1.430', 'weapon3': '1.470', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:51:54,569][63770] DAMAGECOUNT value on done: 5654.0 +[2023-09-14 14:51:54,570][63770] Sum rewards: -2.362, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.940', 'AMMO4': '-0.042', 'AMMO2': '-0.008', 'AMMO5': '0.010', 'ARMOR': '0.015', 'weapon5': '0.076', 'weapon7': '0.104', 'HITCOUNT': '0.110', 'AMMO3': '0.141', 'WEAPON5': '0.200', 'AMMO6': '0.220', 'AMMO7': '0.220', 'WEAPON7': '0.300', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.020', 'weapon2': '1.200', 'FRAGCOUNT': '2.000', 'weapon3': '2.262'} +[2023-09-14 14:51:55,057][63771] DAMAGECOUNT value on done: 3480.0 +[2023-09-14 14:51:55,440][63771] DAMAGECOUNT value on done: 5686.0 +[2023-09-14 14:51:56,573][63733] Updated weights for policy 1, policy_version 1240 (0.0011) +[2023-09-14 14:51:57,466][63576] Saving new best policy, reward=-4.119! +[2023-09-14 14:51:58,825][63767] DAMAGECOUNT value on done: 7721.0 +[2023-09-14 14:51:58,825][63767] Sum rewards: -3.001, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.972', 'AMMO2': '0.011', 'AMMO5': '0.018', 'WEAPON4': '0.050', 'AMMO4': '0.053', 'AMMO3': '0.108', 'HITCOUNT': '0.120', 'weapon5': '0.200', 'WEAPON5': '0.250', 'weapon4': '0.284', 'DAMAGECOUNT': '0.315', 'ARMOR': '0.528', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.074', 'weapon2': '1.610'} +[2023-09-14 14:51:59,089][63732] Updated weights for policy 0, policy_version 1270 (0.0012) +[2023-09-14 14:51:59,190][63767] DAMAGECOUNT value on done: 7707.0 +[2023-09-14 14:51:59,190][63767] Sum rewards: 1.112, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.036', 'AMMO5': '0.010', 'weapon4': '0.014', 'AMMO2': '0.016', 'weapon5': '0.018', 'WEAPON4': '0.050', 'AMMO4': '0.079', 'WEAPON5': '0.100', 'AMMO3': '0.124', 'HITCOUNT': '0.250', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.741', 'ARMOR': '0.876', 'weapon2': '1.364', 'weapon3': '2.206', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:51:59,594][63805] DAMAGECOUNT value on done: 7252.0 +[2023-09-14 14:51:59,595][63805] Sum rewards: -2.611, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.505', 'AMMO4': '-0.029', 'AMMO2': '-0.006', 'AMMO5': '0.010', 'weapon7': '0.050', 'WEAPON4': '0.100', 'weapon5': '0.116', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon4': '0.134', 'WEAPON5': '0.150', 'AMMO3': '0.163', 'WEAPON7': '0.200', 'HITCOUNT': '0.340', 'ARMOR': '0.536', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.150', 'weapon2': '1.340', 'DAMAGECOUNT': '1.395', 'weapon3': '2.004'} +[2023-09-14 14:52:00,011][63805] DAMAGECOUNT value on done: 6275.0 +[2023-09-14 14:52:00,011][63805] Sum rewards: 0.567, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO2': '0.007', 'AMMO5': '0.008', 'WEAPON1': '0.020', 'AMMO4': '0.035', 'HEALTH': '0.082', 'weapon5': '0.100', 'AMMO3': '0.111', 'WEAPON5': '0.150', 'HITCOUNT': '0.280', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.972', 'weapon2': '1.412', 'weapon3': '1.590', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:52:00,899][63734] DAMAGECOUNT value on done: 6601.0 +[2023-09-14 14:52:00,899][63734] Sum rewards: -2.816, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.529', 'AMMO5': '0.005', 'weapon5': '0.014', 'AMMO2': '0.033', 'ARMOR': '0.064', 'AMMO3': '0.090', 'WEAPON5': '0.100', 'AMMO4': '0.163', 'HITCOUNT': '0.170', 'WEAPON4': '0.250', 'weapon4': '0.360', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.594', 'FRAGCOUNT': '1.000', 'weapon3': '1.018', 'weapon2': '1.702'} +[2023-09-14 14:52:01,328][63734] DAMAGECOUNT value on done: 5519.0 +[2023-09-14 14:52:01,329][63734] Sum rewards: -3.512, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.000', 'weapon4': '0.002', 'AMMO2': '0.014', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'AMMO4': '0.070', 'AMMO3': '0.092', 'weapon5': '0.124', 'HITCOUNT': '0.190', 'WEAPON5': '0.250', 'HEALTH': '0.364', 'ARMOR': '0.480', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.579', 'weapon2': '1.062', 'weapon3': '1.874'} +[2023-09-14 14:52:01,550][63771] DAMAGECOUNT value on done: 6859.0 +[2023-09-14 14:52:01,551][63771] Sum rewards: 1.729, reward structure: {'DEATHCOUNT': '-4.500', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.018', 'AMMO3': '0.050', 'AMMO4': '0.089', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'weapon7': '0.124', 'weapon5': '0.184', 'WEAPON3': '0.250', 'HEALTH': '0.268', 'DAMAGECOUNT': '0.393', 'ARMOR': '0.464', 'FRAGCOUNT': '1.000', 'weapon3': '1.260', 'weapon2': '1.604'} +[2023-09-14 14:52:01,981][63771] DAMAGECOUNT value on done: 4717.0 +[2023-09-14 14:52:01,982][63771] Sum rewards: -5.476, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.036', 'AMMO5': '0.005', 'weapon5': '0.008', 'AMMO2': '0.010', 'WEAPON1': '0.020', 'ARMOR': '0.028', 'WEAPON5': '0.050', 'AMMO4': '0.050', 'AMMO3': '0.118', 'WEAPON4': '0.150', 'weapon4': '0.188', 'HITCOUNT': '0.200', 'DAMAGECOUNT': '0.456', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.472', 'weapon2': '1.654'} +[2023-09-14 14:52:02,462][63576] Saving new best policy, reward=-4.061! +[2023-09-14 14:52:04,789][63769] DAMAGECOUNT value on done: 5836.0 +[2023-09-14 14:52:04,790][63769] Sum rewards: -1.796, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.666', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.010', 'AMMO5': '0.020', 'ARMOR': '0.044', 'AMMO4': '0.047', 'weapon7': '0.054', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.109', 'HITCOUNT': '0.200', 'weapon5': '0.204', 'WEAPON5': '0.350', 'WEAPON3': '0.700', 'weapon2': '1.342', 'weapon3': '1.636', 'DAMAGECOUNT': '1.854'} +[2023-09-14 14:52:05,186][63733] Updated weights for policy 1, policy_version 1250 (0.0013) +[2023-09-14 14:52:05,218][63769] DAMAGECOUNT value on done: 6550.0 +[2023-09-14 14:52:05,219][63769] Sum rewards: -1.741, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO5': '0.005', 'weapon5': '0.020', 'AMMO2': '0.028', 'ARMOR': '0.040', 'weapon4': '0.042', 'WEAPON4': '0.050', 'WEAPON5': '0.050', 'AMMO3': '0.061', 'AMMO4': '0.138', 'HITCOUNT': '0.170', 'WEAPON3': '0.350', 'DAMAGECOUNT': '0.423', 'HEALTH': '0.758', 'FRAGCOUNT': '1.000', 'weapon3': '1.200', 'weapon2': '2.174'} +[2023-09-14 14:52:05,701][63732] Updated weights for policy 0, policy_version 1280 (0.0011) +[2023-09-14 14:52:07,470][63576] Saving new best policy, reward=-4.021! +[2023-09-14 14:52:08,146][63770] DAMAGECOUNT value on done: 7299.0 +[2023-09-14 14:52:08,147][63770] Sum rewards: -0.156, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.490', 'AMMO4': '-0.042', 'AMMO2': '-0.008', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'weapon5': '0.046', 'weapon7': '0.066', 'AMMO3': '0.091', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON7': '0.200', 'weapon4': '0.236', 'HITCOUNT': '0.330', 'WEAPON3': '0.700', 'ARMOR': '0.928', 'FRAGCOUNT': '1.000', 'weapon2': '1.206', 'DAMAGECOUNT': '1.332', 'weapon3': '1.532'} +[2023-09-14 14:52:08,424][63806] DAMAGECOUNT value on done: 6037.0 +[2023-09-14 14:52:08,425][63806] Sum rewards: -2.341, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.286', 'AMMO5': '0.015', 'AMMO2': '0.016', 'weapon5': '0.042', 'AMMO4': '0.081', 'AMMO3': '0.092', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'ARMOR': '0.108', 'HITCOUNT': '0.120', 'WEAPON5': '0.150', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.426', 'weapon4': '0.450', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.128', 'weapon3': '1.616'} +[2023-09-14 14:52:08,565][63770] DAMAGECOUNT value on done: 4160.0 +[2023-09-14 14:52:08,739][63806] DAMAGECOUNT value on done: 5932.0 +[2023-09-14 14:52:08,740][63806] Sum rewards: 1.867, reward structure: {'DEATHCOUNT': '-5.250', 'AMMO5': '0.003', 'AMMO2': '0.019', 'weapon5': '0.030', 'WEAPON5': '0.050', 'ARMOR': '0.064', 'AMMO3': '0.090', 'AMMO4': '0.095', 'HITCOUNT': '0.110', 'WEAPON3': '0.350', 'DAMAGECOUNT': '0.450', 'HEALTH': '0.516', 'weapon2': '1.564', 'weapon3': '1.776', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:52:09,773][63735] DAMAGECOUNT value on done: 6027.0 +[2023-09-14 14:52:09,773][63735] Sum rewards: -3.133, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.051', 'AMMO2': '0.007', 'ARMOR': '0.032', 'AMMO4': '0.033', 'AMMO3': '0.130', 'WEAPON4': '0.150', 'HITCOUNT': '0.290', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.200', 'weapon2': '1.684', 'weapon3': '1.692', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:52:10,106][63735] DAMAGECOUNT value on done: 5856.0 +[2023-09-14 14:52:10,106][63735] Sum rewards: 0.247, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.214', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.019', 'WEAPON5': '0.050', 'HITCOUNT': '0.050', 'weapon5': '0.060', 'AMMO3': '0.075', 'AMMO4': '0.094', 'ARMOR': '0.096', 'weapon7': '0.158', 'DAMAGECOUNT': '0.165', 'WEAPON4': '0.200', 'AMMO6': '0.300', 'WEAPON7': '0.300', 'AMMO7': '0.300', 'WEAPON3': '0.350', 'weapon4': '0.558', 'weapon3': '0.922', 'FRAGCOUNT': '1.000', 'weapon2': '1.752'} +[2023-09-14 14:52:12,237][63732] Updated weights for policy 0, policy_version 1290 (0.0011) +[2023-09-14 14:52:13,922][63733] Updated weights for policy 1, policy_version 1260 (0.0011) +[2023-09-14 14:52:14,326][63805] DAMAGECOUNT value on done: 7993.0 +[2023-09-14 14:52:14,327][63805] Sum rewards: -2.789, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.766', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'ARMOR': '0.012', 'AMMO2': '0.015', 'weapon5': '0.040', 'AMMO4': '0.072', 'weapon4': '0.074', 'AMMO3': '0.131', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'HITCOUNT': '0.350', 'WEAPON3': '0.800', 'weapon2': '0.854', 'DAMAGECOUNT': '1.425', 'FRAGCOUNT': '2.000', 'weapon3': '2.534'} +[2023-09-14 14:52:14,753][63805] DAMAGECOUNT value on done: 4760.0 +[2023-09-14 14:52:14,753][63805] Sum rewards: -3.452, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.086', 'AMMO2': '0.012', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'AMMO4': '0.060', 'weapon4': '0.108', 'AMMO3': '0.127', 'WEAPON4': '0.150', 'HITCOUNT': '0.170', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.750', 'weapon3': '1.666', 'weapon2': '1.788', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:52:15,446][63735] DAMAGECOUNT value on done: 6527.0 +[2023-09-14 14:52:15,447][63735] Sum rewards: -1.432, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.280', 'AMMO2': '0.003', 'weapon4': '0.006', 'AMMO5': '0.010', 'ARMOR': '0.012', 'AMMO4': '0.017', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'weapon5': '0.110', 'AMMO3': '0.135', 'WEAPON5': '0.200', 'HITCOUNT': '0.230', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.930', 'weapon2': '1.160', 'FRAGCOUNT': '2.000', 'weapon3': '2.214'} +[2023-09-14 14:52:15,822][63734] DAMAGECOUNT value on done: 6065.0 +[2023-09-14 14:52:15,823][63734] Sum rewards: 1.770, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.504', 'AMMO4': '-0.020', 'AMMO2': '-0.004', 'WEAPON1': '0.010', 'AMMO5': '0.020', 'weapon7': '0.072', 'AMMO3': '0.084', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon5': '0.172', 'weapon4': '0.196', 'WEAPON7': '0.200', 'HITCOUNT': '0.240', 'WEAPON5': '0.350', 'ARMOR': '0.449', 'WEAPON3': '0.650', 'weapon2': '1.446', 'weapon3': '1.564', 'DAMAGECOUNT': '1.755', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:52:15,828][63735] DAMAGECOUNT value on done: 4100.0 +[2023-09-14 14:52:15,828][63735] Sum rewards: -1.161, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.060', 'AMMO2': '0.004', 'weapon4': '0.010', 'WEAPON1': '0.020', 'AMMO4': '0.021', 'ARMOR': '0.036', 'WEAPON4': '0.050', 'AMMO3': '0.113', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.747', 'WEAPON3': '0.750', 'weapon2': '1.708', 'weapon3': '1.730', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:52:16,219][63734] DAMAGECOUNT value on done: 4917.0 +[2023-09-14 14:52:16,220][63734] Sum rewards: -1.574, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.792', 'AMMO2': '0.004', 'AMMO5': '0.017', 'AMMO4': '0.018', 'WEAPON1': '0.020', 'AMMO3': '0.113', 'WEAPON4': '0.200', 'HITCOUNT': '0.270', 'weapon5': '0.278', 'weapon4': '0.302', 'WEAPON5': '0.400', 'ARMOR': '0.484', 'WEAPON3': '0.750', 'weapon3': '1.060', 'DAMAGECOUNT': '1.134', 'weapon2': '1.418', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:52:16,557][63767] DAMAGECOUNT value on done: 6935.0 +[2023-09-14 14:52:16,558][63767] Sum rewards: -3.600, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.773', 'AMMO2': '0.021', 'ARMOR': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.103', 'AMMO4': '0.103', 'HITCOUNT': '0.120', 'weapon4': '0.224', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.660', 'FRAGCOUNT': '1.000', 'weapon3': '1.286', 'weapon2': '1.956'} +[2023-09-14 14:52:16,947][63767] DAMAGECOUNT value on done: 6740.0 +[2023-09-14 14:52:16,948][63767] Sum rewards: -2.769, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.104', 'AMMO5': '0.007', 'AMMO2': '0.014', 'ARMOR': '0.036', 'weapon5': '0.038', 'AMMO4': '0.072', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.122', 'HITCOUNT': '0.170', 'weapon4': '0.194', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.700', 'weapon3': '1.440', 'weapon2': '1.596', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:52:17,466][63576] Saving new best policy, reward=-3.891! +[2023-09-14 14:52:17,688][63769] DAMAGECOUNT value on done: 6851.0 +[2023-09-14 14:52:17,689][63769] Sum rewards: -5.008, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.005', 'AMMO2': '0.012', 'AMMO5': '0.025', 'weapon5': '0.032', 'AMMO4': '0.059', 'ARMOR': '0.064', 'weapon7': '0.072', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.133', 'HITCOUNT': '0.160', 'WEAPON7': '0.200', 'WEAPON5': '0.350', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.744', 'WEAPON3': '0.850', 'weapon2': '1.324', 'weapon3': '1.982'} +[2023-09-14 14:52:18,065][63771] DAMAGECOUNT value on done: 3675.0 +[2023-09-14 14:52:18,066][63771] Sum rewards: -5.281, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.638', 'AMMO5': '0.005', 'AMMO2': '0.007', 'weapon5': '0.012', 'AMMO4': '0.034', 'ARMOR': '0.066', 'AMMO3': '0.090', 'WEAPON5': '0.100', 'HITCOUNT': '0.160', 'WEAPON4': '0.250', 'weapon4': '0.320', 'DAMAGECOUNT': '0.585', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.390', 'weapon3': '1.488'} +[2023-09-14 14:52:18,090][63769] DAMAGECOUNT value on done: 4942.0 +[2023-09-14 14:52:18,090][63769] Sum rewards: -2.890, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.090', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.012', 'AMMO2': '0.016', 'weapon5': '0.020', 'WEAPON4': '0.050', 'AMMO4': '0.077', 'weapon4': '0.098', 'AMMO3': '0.114', 'WEAPON5': '0.150', 'HITCOUNT': '0.250', 'ARMOR': '0.476', 'DAMAGECOUNT': '0.729', 'WEAPON3': '0.800', 'weapon2': '1.354', 'weapon3': '2.054'} +[2023-09-14 14:52:18,412][63771] DAMAGECOUNT value on done: 5963.0 +[2023-09-14 14:52:18,412][63771] Sum rewards: -3.628, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.294', 'AMMO5': '0.005', 'AMMO2': '0.007', 'weapon5': '0.018', 'AMMO4': '0.033', 'ARMOR': '0.048', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.186', 'weapon4': '0.198', 'HITCOUNT': '0.250', 'DAMAGECOUNT': '0.831', 'WEAPON3': '0.900', 'weapon3': '1.608', 'weapon2': '1.632', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:52:18,422][63732] Updated weights for policy 0, policy_version 1300 (0.0012) +[2023-09-14 14:52:18,514][63806] DAMAGECOUNT value on done: 4773.0 +[2023-09-14 14:52:18,867][63806] DAMAGECOUNT value on done: 7374.0 +[2023-09-14 14:52:18,867][63806] Sum rewards: 1.062, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.279', 'AMMO2': '0.009', 'AMMO5': '0.014', 'WEAPON1': '0.030', 'ARMOR': '0.040', 'AMMO4': '0.043', 'WEAPON4': '0.050', 'weapon4': '0.052', 'AMMO3': '0.126', 'weapon5': '0.228', 'HITCOUNT': '0.280', 'WEAPON5': '0.300', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.122', 'weapon2': '1.280', 'weapon3': '1.866', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:52:19,907][63770] DAMAGECOUNT value on done: 5318.0 +[2023-09-14 14:52:20,251][63770] DAMAGECOUNT value on done: 5831.0 +[2023-09-14 14:52:20,252][63770] Sum rewards: -10.862, reward structure: {'DEATHCOUNT': '-13.500', 'FRAGCOUNT': '-3.000', 'HEALTH': '-1.074', 'AMMO5': '0.014', 'AMMO2': '0.020', 'ARMOR': '0.032', 'weapon5': '0.096', 'WEAPON4': '0.100', 'AMMO4': '0.101', 'HITCOUNT': '0.140', 'weapon4': '0.146', 'AMMO3': '0.199', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.531', 'WEAPON3': '1.050', 'weapon2': '1.670', 'weapon3': '1.712'} +[2023-09-14 14:52:22,330][63767] DAMAGECOUNT value on done: 8005.0 +[2023-09-14 14:52:22,331][63767] Sum rewards: 1.065, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.086', 'AMMO5': '0.007', 'AMMO2': '0.013', 'weapon5': '0.030', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'weapon4': '0.056', 'AMMO4': '0.066', 'AMMO3': '0.142', 'WEAPON5': '0.150', 'HITCOUNT': '0.210', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.852', 'weapon3': '1.730', 'weapon2': '1.862', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:52:22,750][63767] DAMAGECOUNT value on done: 7825.0 +[2023-09-14 14:52:23,126][63733] Updated weights for policy 1, policy_version 1270 (0.0013) +[2023-09-14 14:52:24,696][63732] Updated weights for policy 0, policy_version 1310 (0.0011) +[2023-09-14 14:52:24,748][63805] DAMAGECOUNT value on done: 7365.0 +[2023-09-14 14:52:25,132][63805] DAMAGECOUNT value on done: 6591.0 +[2023-09-14 14:52:25,133][63805] Sum rewards: -2.989, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.152', 'AMMO2': '0.011', 'AMMO5': '0.012', 'AMMO4': '0.055', 'AMMO3': '0.071', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'weapon4': '0.186', 'WEAPON5': '0.200', 'weapon5': '0.226', 'WEAPON3': '0.500', 'weapon3': '0.882', 'DAMAGECOUNT': '0.948', 'FRAGCOUNT': '1.500', 'weapon2': '1.772'} +[2023-09-14 14:52:26,084][63734] DAMAGECOUNT value on done: 6831.0 +[2023-09-14 14:52:26,084][63734] Sum rewards: -1.565, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.712', 'AMMO2': '0.001', 'AMMO4': '0.006', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'weapon5': '0.024', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'weapon4': '0.054', 'AMMO3': '0.089', 'HITCOUNT': '0.140', 'WEAPON5': '0.250', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.690', 'weapon3': '1.284', 'weapon2': '1.936', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:52:26,472][63734] DAMAGECOUNT value on done: 5814.0 +[2023-09-14 14:52:26,472][63734] Sum rewards: -6.395, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.290', 'FRAGCOUNT': '-0.500', 'weapon4': '0.010', 'AMMO5': '0.015', 'WEAPON1': '0.030', 'AMMO2': '0.030', 'AMMO3': '0.138', 'WEAPON4': '0.150', 'AMMO4': '0.151', 'weapon5': '0.156', 'HITCOUNT': '0.230', 'WEAPON5': '0.350', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.885', 'weapon2': '1.138', 'weapon3': '1.762'} +[2023-09-14 14:52:26,783][63771] DAMAGECOUNT value on done: 7324.0 +[2023-09-14 14:52:26,783][63771] Sum rewards: -2.841, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.886', 'AMMO2': '0.009', 'weapon7': '0.038', 'AMMO4': '0.045', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.167', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'weapon4': '0.258', 'HITCOUNT': '0.350', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.395', 'weapon2': '1.496', 'weapon3': '1.796', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:52:27,186][63771] DAMAGECOUNT value on done: 4877.0 +[2023-09-14 14:52:27,186][63771] Sum rewards: -2.762, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.860', 'AMMO5': '0.005', 'AMMO2': '0.008', 'WEAPON1': '0.020', 'AMMO4': '0.040', 'weapon5': '0.052', 'ARMOR': '0.060', 'WEAPON5': '0.100', 'AMMO3': '0.119', 'HITCOUNT': '0.160', 'DAMAGECOUNT': '0.480', 'WEAPON3': '0.800', 'weapon2': '1.498', 'weapon3': '1.756', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:52:27,467][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001274_5218304.pth... +[2023-09-14 14:52:27,467][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001314_5382144.pth... +[2023-09-14 14:52:27,528][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000000989_4050944.pth +[2023-09-14 14:52:27,529][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000000952_3899392.pth +[2023-09-14 14:52:27,536][63576] Saving new best policy, reward=-3.822! +[2023-09-14 14:52:30,141][63769] DAMAGECOUNT value on done: 6036.0 +[2023-09-14 14:52:30,142][63769] Sum rewards: -1.098, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.040', 'AMMO4': '-0.041', 'AMMO2': '-0.008', 'AMMO5': '0.005', 'weapon5': '0.042', 'ARMOR': '0.096', 'WEAPON5': '0.100', 'AMMO3': '0.110', 'HITCOUNT': '0.170', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.600', 'weapon2': '1.364', 'weapon3': '1.404', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:52:30,469][63769] DAMAGECOUNT value on done: 6695.0 +[2023-09-14 14:52:30,470][63769] Sum rewards: -3.110, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.730', 'AMMO2': '0.018', 'weapon4': '0.040', 'WEAPON4': '0.050', 'AMMO3': '0.073', 'HITCOUNT': '0.090', 'AMMO4': '0.091', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.435', 'weapon3': '1.242', 'FRAGCOUNT': '2.000', 'weapon2': '2.280'} +[2023-09-14 14:52:30,625][63732] Updated weights for policy 0, policy_version 1320 (0.0011) +[2023-09-14 14:52:31,579][63806] DAMAGECOUNT value on done: 6207.0 +[2023-09-14 14:52:31,580][63806] Sum rewards: -0.667, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO2': '0.004', 'AMMO5': '0.017', 'AMMO4': '0.018', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'HEALTH': '0.116', 'HITCOUNT': '0.130', 'AMMO3': '0.136', 'WEAPON5': '0.250', 'weapon5': '0.284', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.510', 'ARMOR': '0.510', 'WEAPON3': '0.700', 'weapon3': '1.402', 'weapon2': '1.956'} +[2023-09-14 14:52:31,994][63806] DAMAGECOUNT value on done: 6127.0 +[2023-09-14 14:52:31,994][63806] Sum rewards: -7.716, reward structure: {'DEATHCOUNT': '-10.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.229', 'AMMO2': '0.003', 'AMMO4': '0.014', 'AMMO5': '0.018', 'WEAPON4': '0.050', 'ARMOR': '0.060', 'AMMO3': '0.156', 'HITCOUNT': '0.190', 'weapon4': '0.222', 'weapon5': '0.240', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.585', 'WEAPON3': '0.800', 'weapon2': '1.096', 'weapon3': '1.830'} +[2023-09-14 14:52:32,462][63576] Saving new best policy, reward=-3.805! +[2023-09-14 14:52:32,635][63733] Updated weights for policy 1, policy_version 1280 (0.0010) +[2023-09-14 14:52:33,303][63735] DAMAGECOUNT value on done: 6523.0 +[2023-09-14 14:52:33,303][63735] Sum rewards: -5.791, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-3.432', 'AMMO4': '-0.012', 'AMMO2': '-0.002', 'AMMO5': '0.016', 'WEAPON1': '0.020', 'weapon7': '0.022', 'ARMOR': '0.052', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.191', 'HITCOUNT': '0.200', 'weapon5': '0.216', 'WEAPON5': '0.400', 'WEAPON3': '0.950', 'weapon3': '1.278', 'DAMAGECOUNT': '1.488', 'weapon2': '2.022', 'FRAGCOUNT': '2.500'} +[2023-09-14 14:52:33,446][63770] DAMAGECOUNT value on done: 7471.0 +[2023-09-14 14:52:33,447][63770] Sum rewards: -6.407, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.520', 'AMMO2': '0.001', 'AMMO4': '0.006', 'AMMO5': '0.015', 'ARMOR': '0.020', 'WEAPON1': '0.030', 'weapon4': '0.034', 'WEAPON4': '0.050', 'weapon5': '0.076', 'weapon7': '0.080', 'HITCOUNT': '0.170', 'AMMO3': '0.195', 'WEAPON7': '0.200', 'AMMO6': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.516', 'WEAPON3': '1.050', 'weapon2': '1.404', 'FRAGCOUNT': '1.500', 'weapon3': '1.866'} +[2023-09-14 14:52:33,674][63735] DAMAGECOUNT value on done: 6121.0 +[2023-09-14 14:52:33,675][63735] Sum rewards: 0.537, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.520', 'AMMO2': '0.001', 'AMMO4': '0.005', 'AMMO5': '0.012', 'ARMOR': '0.036', 'AMMO3': '0.100', 'weapon5': '0.172', 'HITCOUNT': '0.270', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.795', 'weapon2': '1.022', 'weapon3': '2.244', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:52:33,839][63770] DAMAGECOUNT value on done: 4445.0 +[2023-09-14 14:52:33,839][63770] Sum rewards: -2.303, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.073', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.016', 'weapon5': '0.022', 'WEAPON4': '0.050', 'AMMO4': '0.082', 'WEAPON5': '0.100', 'AMMO3': '0.110', 'HITCOUNT': '0.130', 'weapon4': '0.180', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.855', 'FRAGCOUNT': '1.000', 'weapon3': '1.450', 'weapon2': '1.710'} +[2023-09-14 14:52:36,576][63732] Updated weights for policy 0, policy_version 1330 (0.0012) +[2023-09-14 14:52:37,528][63576] Saving new best policy, reward=-3.768! +[2023-09-14 14:52:38,916][63767] DAMAGECOUNT value on done: 7107.0 +[2023-09-14 14:52:39,192][63735] Large shaping reward -2.504 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.255, -85.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 14:52:39,263][63767] DAMAGECOUNT value on done: 6950.0 +[2023-09-14 14:52:39,264][63767] Sum rewards: -3.959, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.825', 'AMMO4': '-0.045', 'AMMO2': '-0.009', 'weapon5': '0.008', 'AMMO5': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.056', 'AMMO3': '0.073', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'HITCOUNT': '0.190', 'weapon4': '0.208', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.630', 'weapon3': '1.170', 'weapon2': '1.750'} +[2023-09-14 14:52:39,391][63805] DAMAGECOUNT value on done: 8493.0 +[2023-09-14 14:52:39,392][63805] Sum rewards: -3.169, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.408', 'AMMO2': '0.006', 'AMMO5': '0.018', 'AMMO4': '0.031', 'AMMO3': '0.185', 'weapon5': '0.228', 'HITCOUNT': '0.390', 'WEAPON5': '0.400', 'weapon2': '1.064', 'WEAPON3': '1.100', 'DAMAGECOUNT': '1.500', 'weapon3': '2.316', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:52:39,806][63734] DAMAGECOUNT value on done: 6360.0 +[2023-09-14 14:52:39,807][63734] Sum rewards: -3.445, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.478', 'AMMO2': '0.010', 'AMMO5': '0.028', 'ARMOR': '0.028', 'weapon4': '0.042', 'AMMO4': '0.049', 'WEAPON1': '0.050', 'weapon5': '0.090', 'WEAPON4': '0.100', 'AMMO3': '0.165', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.230', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.885', 'WEAPON3': '1.000', 'weapon2': '1.366', 'weapon3': '1.990', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:52:39,820][63805] DAMAGECOUNT value on done: 5045.0 +[2023-09-14 14:52:39,820][63805] Sum rewards: -1.205, reward structure: {'DEATHCOUNT': '-9.000', 'AMMO5': '0.010', 'weapon5': '0.012', 'AMMO2': '0.013', 'HEALTH': '0.018', 'AMMO4': '0.066', 'WEAPON4': '0.100', 'AMMO3': '0.103', 'weapon4': '0.112', 'WEAPON5': '0.200', 'HITCOUNT': '0.210', 'ARMOR': '0.493', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.855', 'weapon3': '1.506', 'weapon2': '1.546', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:52:40,192][63734] DAMAGECOUNT value on done: 5119.0 +[2023-09-14 14:52:40,193][63734] Sum rewards: -3.586, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.478', 'AMMO5': '0.005', 'AMMO2': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.062', 'AMMO3': '0.121', 'weapon5': '0.138', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.606', 'WEAPON3': '0.750', 'ARMOR': '0.846', 'FRAGCOUNT': '1.500', 'weapon3': '1.544', 'weapon2': '1.718'} +[2023-09-14 14:52:40,234][63735] DAMAGECOUNT value on done: 7242.0 +[2023-09-14 14:52:40,235][63735] Sum rewards: -1.419, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.926', 'AMMO5': '0.010', 'AMMO2': '0.028', 'ARMOR': '0.040', 'WEAPON1': '0.040', 'weapon4': '0.050', 'AMMO4': '0.140', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'weapon5': '0.152', 'AMMO3': '0.157', 'HITCOUNT': '0.410', 'WEAPON3': '0.850', 'weapon2': '1.696', 'weapon3': '1.738', 'DAMAGECOUNT': '2.145', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:52:40,537][63771] DAMAGECOUNT value on done: 3930.0 +[2023-09-14 14:52:40,596][63735] DAMAGECOUNT value on done: 4188.0 +[2023-09-14 14:52:40,596][63735] Sum rewards: -2.707, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.851', 'AMMO5': '0.007', 'AMMO2': '0.018', 'ARMOR': '0.032', 'AMMO3': '0.066', 'AMMO4': '0.089', 'HITCOUNT': '0.110', 'weapon5': '0.124', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.264', 'weapon4': '0.354', 'WEAPON3': '0.450', 'FRAGCOUNT': '0.500', 'weapon3': '1.186', 'weapon2': '1.394'} +[2023-09-14 14:52:40,932][63771] DAMAGECOUNT value on done: 6308.0 +[2023-09-14 14:52:40,933][63771] Sum rewards: -3.789, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.175', 'WEAPON1': '0.020', 'AMMO2': '0.039', 'ARMOR': '0.052', 'WEAPON4': '0.100', 'AMMO3': '0.151', 'AMMO4': '0.193', 'weapon4': '0.210', 'HITCOUNT': '0.250', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.035', 'weapon3': '1.576', 'weapon2': '1.710'} +[2023-09-14 14:52:41,660][63769] DAMAGECOUNT value on done: 7310.0 +[2023-09-14 14:52:41,660][63769] Sum rewards: 0.655, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.300', 'AMMO2': '0.006', 'ARMOR': '0.008', 'WEAPON1': '0.020', 'AMMO5': '0.025', 'AMMO4': '0.031', 'weapon7': '0.058', 'AMMO3': '0.073', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON7': '0.200', 'weapon5': '0.218', 'HITCOUNT': '0.280', 'weapon4': '0.326', 'WEAPON5': '0.400', 'WEAPON3': '0.500', 'weapon2': '0.702', 'weapon3': '1.140', 'DAMAGECOUNT': '1.377', 'FRAGCOUNT': '1.500'} +[2023-09-14 14:52:42,048][63769] DAMAGECOUNT value on done: 5445.0 +[2023-09-14 14:52:42,049][63769] Sum rewards: 2.934, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.380', 'ARMOR': '0.008', 'AMMO2': '0.011', 'AMMO5': '0.013', 'AMMO4': '0.053', 'AMMO3': '0.096', 'weapon5': '0.176', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'weapon4': '0.336', 'WEAPON3': '0.550', 'weapon2': '1.270', 'DAMAGECOUNT': '1.509', 'weapon3': '1.622', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:52:42,474][63576] Saving new best policy, reward=-3.711! +[2023-09-14 14:52:42,478][63732] Updated weights for policy 0, policy_version 1340 (0.0012) +[2023-09-14 14:52:42,480][63733] Updated weights for policy 1, policy_version 1290 (0.0011) +[2023-09-14 14:52:42,524][63735] Large shaping reward -2.534 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.28500000000000003, -95.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 14:52:43,269][63806] DAMAGECOUNT value on done: 4828.0 +[2023-09-14 14:52:43,701][63806] DAMAGECOUNT value on done: 7869.0 +[2023-09-14 14:52:43,701][63806] Sum rewards: -0.760, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.719', 'AMMO2': '0.006', 'AMMO5': '0.010', 'AMMO4': '0.031', 'WEAPON4': '0.050', 'ARMOR': '0.059', 'weapon4': '0.076', 'WEAPON5': '0.100', 'AMMO3': '0.132', 'weapon5': '0.168', 'HITCOUNT': '0.360', 'WEAPON3': '0.900', 'weapon2': '0.914', 'DAMAGECOUNT': '1.485', 'FRAGCOUNT': '1.500', 'weapon3': '2.418'} +[2023-09-14 14:52:45,074][63770] DAMAGECOUNT value on done: 5574.0 +[2023-09-14 14:52:45,075][63770] Sum rewards: -1.853, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.678', 'AMMO4': '-0.004', 'AMMO2': '-0.001', 'AMMO5': '0.003', 'ARMOR': '0.020', 'WEAPON5': '0.050', 'AMMO3': '0.105', 'weapon5': '0.116', 'HITCOUNT': '0.190', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.768', 'FRAGCOUNT': '1.000', 'weapon3': '1.280', 'weapon2': '1.448'} +[2023-09-14 14:52:45,441][63770] DAMAGECOUNT value on done: 6403.0 +[2023-09-14 14:52:45,441][63770] Sum rewards: 2.498, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.640', 'AMMO2': '0.005', 'AMMO5': '0.016', 'WEAPON1': '0.020', 'AMMO4': '0.025', 'AMMO3': '0.117', 'WEAPON4': '0.200', 'weapon4': '0.262', 'WEAPON5': '0.300', 'HITCOUNT': '0.360', 'weapon5': '0.372', 'ARMOR': '0.516', 'WEAPON3': '0.600', 'weapon3': '1.318', 'weapon2': '1.560', 'DAMAGECOUNT': '1.716', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:52:45,540][63767] DAMAGECOUNT value on done: 8259.0 +[2023-09-14 14:52:45,541][63767] Sum rewards: -1.651, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.528', 'AMMO2': '0.010', 'AMMO5': '0.021', 'AMMO4': '0.050', 'ARMOR': '0.088', 'WEAPON4': '0.100', 'AMMO3': '0.149', 'HITCOUNT': '0.150', 'weapon5': '0.162', 'weapon4': '0.302', 'WEAPON5': '0.350', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.762', 'weapon2': '1.432', 'weapon3': '1.600', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:52:45,920][63767] DAMAGECOUNT value on done: 8199.0 +[2023-09-14 14:52:45,921][63767] Sum rewards: -4.952, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-2.000', 'HEALTH': '-0.018', 'WEAPON1': '0.010', 'AMMO2': '0.016', 'AMMO5': '0.020', 'ARMOR': '0.024', 'AMMO4': '0.082', 'AMMO3': '0.122', 'HITCOUNT': '0.140', 'weapon5': '0.160', 'WEAPON5': '0.350', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.122', 'weapon2': '1.498', 'weapon3': '1.822'} +[2023-09-14 14:52:47,467][63576] Saving new best policy, reward=-3.647! +[2023-09-14 14:52:48,456][63805] DAMAGECOUNT value on done: 7896.0 +[2023-09-14 14:52:48,457][63805] Sum rewards: -0.949, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.192', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'weapon4': '0.020', 'AMMO2': '0.020', 'ARMOR': '0.048', 'weapon5': '0.088', 'WEAPON4': '0.100', 'AMMO4': '0.101', 'AMMO3': '0.116', 'WEAPON5': '0.250', 'HITCOUNT': '0.310', 'WEAPON3': '0.650', 'weapon3': '1.568', 'DAMAGECOUNT': '1.593', 'weapon2': '1.846', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:52:48,804][63805] DAMAGECOUNT value on done: 6929.0 +[2023-09-14 14:52:48,804][63805] Sum rewards: 1.751, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.226', 'AMMO4': '-0.043', 'AMMO2': '-0.009', 'AMMO5': '0.009', 'WEAPON1': '0.010', 'ARMOR': '0.016', 'weapon5': '0.074', 'AMMO3': '0.114', 'weapon7': '0.136', 'HITCOUNT': '0.170', 'WEAPON5': '0.200', 'AMMO6': '0.240', 'AMMO7': '0.240', 'WEAPON7': '0.400', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.014', 'weapon2': '1.274', 'weapon3': '1.982', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:52:48,929][63732] Updated weights for policy 0, policy_version 1350 (0.0010) +[2023-09-14 14:52:50,916][63733] Updated weights for policy 1, policy_version 1300 (0.0011) +[2023-09-14 14:52:51,450][63734] DAMAGECOUNT value on done: 7189.0 +[2023-09-14 14:52:51,450][63734] Sum rewards: -4.637, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.520', 'AMMO4': '-0.031', 'AMMO2': '-0.006', 'AMMO5': '0.003', 'ARMOR': '0.040', 'weapon5': '0.060', 'WEAPON5': '0.100', 'AMMO3': '0.115', 'HITCOUNT': '0.200', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.074', 'weapon3': '1.470', 'weapon2': '1.858'} +[2023-09-14 14:52:51,895][63734] DAMAGECOUNT value on done: 6199.0 +[2023-09-14 14:52:51,896][63734] Sum rewards: -6.061, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.959', 'AMMO4': '-0.018', 'AMMO2': '-0.004', 'AMMO5': '0.008', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'WEAPON4': '0.050', 'weapon5': '0.062', 'weapon4': '0.080', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON5': '0.150', 'AMMO3': '0.177', 'HITCOUNT': '0.320', 'WEAPON3': '1.000', 'DAMAGECOUNT': '1.155', 'weapon3': '1.504', 'weapon2': '1.808', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:52:51,906][63771] DAMAGECOUNT value on done: 7559.0 +[2023-09-14 14:52:51,907][63771] Sum rewards: -3.501, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.990', 'AMMO2': '0.004', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO4': '0.018', 'weapon5': '0.046', 'AMMO3': '0.146', 'WEAPON5': '0.200', 'HITCOUNT': '0.210', 'ARMOR': '0.424', 'DAMAGECOUNT': '0.705', 'WEAPON3': '0.900', 'weapon2': '1.090', 'FRAGCOUNT': '2.000', 'weapon3': '2.226'} +[2023-09-14 14:52:52,240][63771] DAMAGECOUNT value on done: 5111.0 +[2023-09-14 14:52:52,241][63771] Sum rewards: -3.077, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.575', 'AMMO2': '0.002', 'AMMO4': '0.008', 'AMMO5': '0.009', 'ARMOR': '0.016', 'WEAPON1': '0.020', 'AMMO3': '0.075', 'weapon5': '0.112', 'HITCOUNT': '0.140', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'weapon4': '0.230', 'WEAPON3': '0.400', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.702', 'weapon3': '0.972', 'weapon2': '1.712'} +[2023-09-14 14:52:54,989][63806] DAMAGECOUNT value on done: 6675.0 +[2023-09-14 14:52:54,990][63806] Sum rewards: -4.429, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.106', 'AMMO4': '-0.034', 'AMMO2': '-0.007', 'AMMO5': '0.017', 'ARMOR': '0.020', 'weapon5': '0.176', 'AMMO3': '0.184', 'WEAPON5': '0.350', 'HITCOUNT': '0.400', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.404', 'weapon2': '1.540', 'weapon3': '1.776'} +[2023-09-14 14:52:55,328][63806] DAMAGECOUNT value on done: 6257.0 +[2023-09-14 14:52:55,328][63806] Sum rewards: -1.617, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.848', 'AMMO5': '0.015', 'weapon5': '0.028', 'AMMO2': '0.039', 'HITCOUNT': '0.120', 'AMMO3': '0.143', 'AMMO4': '0.193', 'WEAPON4': '0.200', 'weapon4': '0.222', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.390', 'ARMOR': '0.400', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.024', 'weapon3': '1.858'} +[2023-09-14 14:52:55,358][63769] DAMAGECOUNT value on done: 6185.0 +[2023-09-14 14:52:55,359][63769] Sum rewards: -3.608, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.180', 'AMMO2': '0.002', 'AMMO4': '0.008', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'weapon5': '0.072', 'AMMO3': '0.106', 'HITCOUNT': '0.140', 'weapon7': '0.180', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.376', 'AMMO6': '0.420', 'AMMO7': '0.420', 'DAMAGECOUNT': '0.447', 'WEAPON7': '0.500', 'WEAPON3': '0.600', 'weapon3': '0.894', 'weapon2': '1.592', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:52:55,613][63732] Updated weights for policy 0, policy_version 1360 (0.0011) +[2023-09-14 14:52:55,844][63769] DAMAGECOUNT value on done: 6807.0 +[2023-09-14 14:52:56,676][63735] DAMAGECOUNT value on done: 7000.0 +[2023-09-14 14:52:56,676][63735] Sum rewards: -6.758, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-0.684', 'FRAGCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.014', 'AMMO4': '0.022', 'ARMOR': '0.028', 'AMMO3': '0.170', 'weapon5': '0.260', 'WEAPON5': '0.300', 'HITCOUNT': '0.370', 'WEAPON3': '0.800', 'weapon2': '1.344', 'DAMAGECOUNT': '1.431', 'weapon3': '1.932'} +[2023-09-14 14:52:57,041][63735] DAMAGECOUNT value on done: 6906.0 +[2023-09-14 14:52:57,042][63735] Sum rewards: 0.212, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.716', 'AMMO2': '0.010', 'AMMO5': '0.022', 'WEAPON1': '0.030', 'AMMO4': '0.049', 'AMMO3': '0.182', 'weapon5': '0.292', 'HITCOUNT': '0.370', 'WEAPON5': '0.450', 'WEAPON3': '1.000', 'weapon2': '1.156', 'weapon3': '2.012', 'DAMAGECOUNT': '2.355', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:52:58,785][63733] Updated weights for policy 1, policy_version 1310 (0.0011) +[2023-09-14 14:52:58,875][63770] DAMAGECOUNT value on done: 7617.0 +[2023-09-14 14:52:59,284][63770] DAMAGECOUNT value on done: 4627.0 +[2023-09-14 14:52:59,284][63770] Sum rewards: -0.023, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.572', 'AMMO2': '0.007', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'weapon4': '0.012', 'AMMO4': '0.037', 'WEAPON4': '0.050', 'weapon5': '0.074', 'AMMO3': '0.132', 'HITCOUNT': '0.170', 'WEAPON5': '0.200', 'ARMOR': '0.445', 'DAMAGECOUNT': '0.546', 'WEAPON3': '0.700', 'weapon3': '1.502', 'weapon2': '1.904', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:53:01,310][63767] DAMAGECOUNT value on done: 7237.0 +[2023-09-14 14:53:01,311][63767] Sum rewards: -5.067, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.000', 'HEALTH': '-0.340', 'AMMO5': '0.005', 'AMMO2': '0.018', 'WEAPON1': '0.030', 'AMMO4': '0.088', 'AMMO3': '0.088', 'WEAPON5': '0.100', 'HITCOUNT': '0.130', 'weapon5': '0.244', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.450', 'weapon3': '1.092', 'weapon2': '1.888'} +[2023-09-14 14:53:01,653][63767] DAMAGECOUNT value on done: 7025.0 +[2023-09-14 14:53:01,653][63767] Sum rewards: -7.776, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.972', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.007', 'AMMO2': '0.018', 'WEAPON1': '0.030', 'AMMO3': '0.059', 'HITCOUNT': '0.060', 'AMMO4': '0.089', 'weapon5': '0.130', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'weapon4': '0.160', 'DAMAGECOUNT': '0.225', 'ARMOR': '0.432', 'WEAPON3': '0.450', 'weapon3': '0.834', 'weapon2': '1.902'} +[2023-09-14 14:53:02,485][63732] Updated weights for policy 0, policy_version 1370 (0.0010) +[2023-09-14 14:53:04,172][63771] DAMAGECOUNT value on done: 4148.0 +[2023-09-14 14:53:04,173][63771] Sum rewards: -0.235, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.062', 'AMMO5': '0.014', 'ARMOR': '0.028', 'AMMO2': '0.028', 'WEAPON4': '0.100', 'weapon5': '0.126', 'AMMO3': '0.130', 'AMMO4': '0.140', 'HITCOUNT': '0.230', 'WEAPON5': '0.300', 'weapon4': '0.392', 'DAMAGECOUNT': '0.654', 'WEAPON3': '0.750', 'weapon2': '1.138', 'weapon3': '1.796', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:53:04,187][63805] DAMAGECOUNT value on done: 8717.0 +[2023-09-14 14:53:04,188][63805] Sum rewards: -3.777, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.807', 'AMMO5': '0.010', 'AMMO2': '0.024', 'AMMO4': '0.117', 'HITCOUNT': '0.140', 'AMMO3': '0.151', 'weapon5': '0.222', 'WEAPON5': '0.250', 'WEAPON4': '0.300', 'weapon4': '0.308', 'ARMOR': '0.444', 'DAMAGECOUNT': '0.672', 'WEAPON3': '0.800', 'weapon2': '0.962', 'FRAGCOUNT': '1.000', 'weapon3': '1.630'} +[2023-09-14 14:53:04,578][63771] DAMAGECOUNT value on done: 6546.0 +[2023-09-14 14:53:04,579][63771] Sum rewards: -2.509, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.001', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO2': '0.018', 'ARMOR': '0.064', 'AMMO4': '0.092', 'WEAPON4': '0.100', 'weapon4': '0.138', 'AMMO3': '0.158', 'HITCOUNT': '0.180', 'weapon5': '0.190', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.714', 'FRAGCOUNT': '1.500', 'weapon2': '1.568', 'weapon3': '1.598'} +[2023-09-14 14:53:04,580][63805] DAMAGECOUNT value on done: 5145.0 +[2023-09-14 14:53:04,580][63805] Sum rewards: -2.819, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.418', 'AMMO5': '0.005', 'AMMO2': '0.008', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'AMMO4': '0.039', 'weapon5': '0.062', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.107', 'HITCOUNT': '0.120', 'weapon4': '0.162', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.522', 'weapon3': '1.568'} +[2023-09-14 14:53:04,808][63735] DAMAGECOUNT value on done: 7317.0 +[2023-09-14 14:53:04,809][63735] Sum rewards: -5.088, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.876', 'AMMO5': '0.017', 'AMMO2': '0.018', 'HITCOUNT': '0.070', 'AMMO4': '0.087', 'AMMO3': '0.112', 'weapon5': '0.176', 'DAMAGECOUNT': '0.225', 'WEAPON4': '0.250', 'WEAPON5': '0.300', 'weapon4': '0.306', 'ARMOR': '0.436', 'WEAPON3': '0.600', 'weapon2': '1.346', 'weapon3': '1.594'} +[2023-09-14 14:53:04,861][63769] DAMAGECOUNT value on done: 7626.0 +[2023-09-14 14:53:04,862][63769] Sum rewards: -7.164, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-2.344', 'AMMO5': '0.005', 'weapon5': '0.006', 'AMMO2': '0.012', 'ARMOR': '0.020', 'WEAPON1': '0.040', 'weapon4': '0.044', 'AMMO4': '0.059', 'WEAPON5': '0.100', 'WEAPON4': '0.150', 'AMMO3': '0.230', 'HITCOUNT': '0.290', 'DAMAGECOUNT': '0.948', 'WEAPON3': '1.250', 'weapon2': '1.368', 'FRAGCOUNT': '2.000', 'weapon3': '2.158'} +[2023-09-14 14:53:05,199][63735] DAMAGECOUNT value on done: 4378.0 +[2023-09-14 14:53:05,200][63735] Sum rewards: -1.677, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.332', 'AMMO2': '0.006', 'AMMO5': '0.013', 'AMMO4': '0.030', 'WEAPON4': '0.050', 'weapon4': '0.090', 'HITCOUNT': '0.130', 'AMMO3': '0.138', 'weapon5': '0.194', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.570', 'WEAPON3': '0.850', 'weapon2': '1.348', 'weapon3': '1.986', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:53:05,219][63734] DAMAGECOUNT value on done: 6576.0 +[2023-09-14 14:53:05,220][63734] Sum rewards: -1.208, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.076', 'AMMO5': '0.003', 'AMMO2': '0.006', 'ARMOR': '0.020', 'AMMO4': '0.029', 'WEAPON5': '0.050', 'weapon7': '0.066', 'AMMO3': '0.069', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'HITCOUNT': '0.170', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.648', 'weapon3': '0.890', 'weapon2': '1.668', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:53:05,248][63769] DAMAGECOUNT value on done: 5726.0 +[2023-09-14 14:53:05,248][63769] Sum rewards: -5.028, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.828', 'AMMO2': '0.004', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'AMMO4': '0.021', 'ARMOR': '0.033', 'AMMO3': '0.103', 'WEAPON5': '0.150', 'HITCOUNT': '0.270', 'weapon5': '0.292', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.843', 'weapon2': '1.432', 'weapon3': '1.672'} +[2023-09-14 14:53:05,612][63734] DAMAGECOUNT value on done: 5339.0 +[2023-09-14 14:53:05,613][63734] Sum rewards: -1.505, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.419', 'AMMO5': '0.005', 'AMMO2': '0.008', 'WEAPON1': '0.010', 'AMMO4': '0.039', 'AMMO3': '0.100', 'ARMOR': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.100', 'HITCOUNT': '0.140', 'weapon5': '0.140', 'WEAPON5': '0.150', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.660', 'FRAGCOUNT': '1.000', 'weapon3': '1.498', 'weapon2': '1.814'} +[2023-09-14 14:53:05,889][63806] DAMAGECOUNT value on done: 4997.0 +[2023-09-14 14:53:05,889][63806] Sum rewards: -4.900, reward structure: {'DEATHCOUNT': '-11.250', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO2': '0.023', 'weapon5': '0.042', 'ARMOR': '0.056', 'AMMO3': '0.092', 'AMMO4': '0.112', 'HEALTH': '0.148', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'HITCOUNT': '0.170', 'weapon4': '0.344', 'DAMAGECOUNT': '0.507', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.298', 'weapon2': '1.630'} +[2023-09-14 14:53:06,214][63806] DAMAGECOUNT value on done: 8174.0 +[2023-09-14 14:53:06,215][63806] Sum rewards: -4.299, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.410', 'ARMOR': '0.008', 'AMMO5': '0.012', 'AMMO2': '0.015', 'weapon5': '0.064', 'AMMO4': '0.075', 'AMMO3': '0.085', 'WEAPON5': '0.100', 'weapon4': '0.146', 'HITCOUNT': '0.250', 'WEAPON4': '0.250', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.915', 'weapon3': '1.262', 'weapon2': '1.828', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:53:06,477][63733] Updated weights for policy 1, policy_version 1320 (0.0010) +[2023-09-14 14:53:07,466][63576] Saving new best policy, reward=-3.612! +[2023-09-14 14:53:08,786][63767] DAMAGECOUNT value on done: 8680.0 +[2023-09-14 14:53:08,787][63767] Sum rewards: 4.721, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.013', 'AMMO5': '0.010', 'AMMO2': '0.032', 'AMMO3': '0.056', 'WEAPON5': '0.150', 'AMMO4': '0.161', 'WEAPON4': '0.250', 'HITCOUNT': '0.290', 'WEAPON3': '0.300', 'weapon5': '0.332', 'ARMOR': '0.432', 'weapon4': '0.668', 'weapon3': '0.684', 'DAMAGECOUNT': '1.263', 'weapon2': '1.356', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:53:09,127][63767] DAMAGECOUNT value on done: 8554.0 +[2023-09-14 14:53:09,127][63767] Sum rewards: -3.832, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.244', 'AMMO5': '0.007', 'ARMOR': '0.020', 'WEAPON1': '0.020', 'AMMO2': '0.028', 'weapon5': '0.044', 'AMMO3': '0.130', 'AMMO4': '0.142', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'weapon4': '0.262', 'HITCOUNT': '0.300', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.020', 'weapon2': '1.512', 'weapon3': '1.526'} +[2023-09-14 14:53:09,940][63732] Updated weights for policy 0, policy_version 1380 (0.0010) +[2023-09-14 14:53:10,614][63770] DAMAGECOUNT value on done: 5841.0 +[2023-09-14 14:53:10,615][63770] Sum rewards: -4.404, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.252', 'AMMO5': '0.005', 'AMMO2': '0.014', 'WEAPON1': '0.030', 'ARMOR': '0.040', 'weapon5': '0.046', 'weapon4': '0.062', 'AMMO4': '0.071', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.133', 'weapon7': '0.184', 'HITCOUNT': '0.210', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.801', 'WEAPON3': '0.850', 'weapon2': '1.334', 'weapon3': '1.818'} +[2023-09-14 14:53:11,018][63770] DAMAGECOUNT value on done: 6776.0 +[2023-09-14 14:53:11,018][63770] Sum rewards: -3.679, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.732', 'AMMO5': '0.003', 'WEAPON1': '0.020', 'AMMO2': '0.022', 'WEAPON5': '0.050', 'ARMOR': '0.072', 'weapon7': '0.092', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO4': '0.110', 'AMMO3': '0.167', 'weapon5': '0.194', 'HITCOUNT': '0.240', 'WEAPON4': '0.250', 'weapon4': '0.408', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.119', 'weapon2': '1.304', 'weapon3': '1.452'} +[2023-09-14 14:53:11,739][63805] DAMAGECOUNT value on done: 8512.0 +[2023-09-14 14:53:11,740][63805] Sum rewards: -0.836, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.963', 'AMMO2': '0.008', 'ARMOR': '0.008', 'AMMO5': '0.020', 'WEAPON1': '0.020', 'AMMO4': '0.039', 'WEAPON4': '0.050', 'weapon4': '0.080', 'AMMO3': '0.122', 'weapon5': '0.146', 'WEAPON5': '0.400', 'HITCOUNT': '0.440', 'WEAPON3': '0.750', 'weapon2': '1.338', 'DAMAGECOUNT': '1.848', 'weapon3': '1.858', 'FRAGCOUNT': '3.500'} +[2023-09-14 14:53:12,080][63805] DAMAGECOUNT value on done: 7725.0 +[2023-09-14 14:53:12,080][63805] Sum rewards: 2.175, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.870', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.021', 'ARMOR': '0.044', 'weapon5': '0.092', 'AMMO3': '0.099', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.104', 'weapon7': '0.110', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'weapon4': '0.226', 'WEAPON3': '0.600', 'weapon2': '1.434', 'weapon3': '1.480', 'DAMAGECOUNT': '1.500', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:53:13,225][63733] Updated weights for policy 1, policy_version 1330 (0.0010) +[2023-09-14 14:53:15,099][63771] DAMAGECOUNT value on done: 7804.0 +[2023-09-14 14:53:15,100][63771] Sum rewards: -3.412, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.150', 'AMMO2': '0.006', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO4': '0.029', 'ARMOR': '0.084', 'AMMO3': '0.118', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'weapon5': '0.182', 'WEAPON4': '0.200', 'weapon4': '0.284', 'DAMAGECOUNT': '0.735', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.320', 'weapon3': '1.632'} +[2023-09-14 14:53:15,508][63771] DAMAGECOUNT value on done: 5169.0 +[2023-09-14 14:53:16,671][63734] DAMAGECOUNT value on done: 7359.0 +[2023-09-14 14:53:16,671][63734] Sum rewards: -1.837, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.856', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO2': '0.018', 'ARMOR': '0.036', 'AMMO3': '0.066', 'AMMO4': '0.089', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'weapon5': '0.152', 'weapon4': '0.192', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.510', 'weapon3': '0.934', 'FRAGCOUNT': '1.000', 'weapon2': '1.900'} +[2023-09-14 14:53:17,061][63734] DAMAGECOUNT value on done: 6369.0 +[2023-09-14 14:53:17,062][63734] Sum rewards: -2.528, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.429', 'AMMO2': '0.010', 'AMMO5': '0.027', 'AMMO4': '0.052', 'WEAPON4': '0.100', 'AMMO3': '0.117', 'HITCOUNT': '0.140', 'weapon5': '0.174', 'weapon4': '0.270', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.510', 'ARMOR': '0.559', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.332', 'weapon3': '1.610'} +[2023-09-14 14:53:17,467][63576] Saving new best policy, reward=-3.477! +[2023-09-14 14:53:17,573][63732] Updated weights for policy 0, policy_version 1390 (0.0011) +[2023-09-14 14:53:17,751][63806] DAMAGECOUNT value on done: 7150.0 +[2023-09-14 14:53:17,751][63806] Sum rewards: -3.673, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.118', 'AMMO2': '0.013', 'AMMO5': '0.017', 'ARMOR': '0.032', 'weapon5': '0.050', 'AMMO4': '0.066', 'WEAPON4': '0.100', 'AMMO3': '0.170', 'WEAPON5': '0.250', 'HITCOUNT': '0.260', 'weapon4': '0.342', 'weapon2': '1.088', 'WEAPON3': '1.100', 'DAMAGECOUNT': '1.425', 'FRAGCOUNT': '2.000', 'weapon3': '2.032'} +[2023-09-14 14:53:18,081][63806] DAMAGECOUNT value on done: 6596.0 +[2023-09-14 14:53:18,082][63806] Sum rewards: -2.430, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.729', 'AMMO5': '0.005', 'AMMO2': '0.018', 'WEAPON5': '0.050', 'weapon5': '0.060', 'AMMO4': '0.087', 'AMMO3': '0.151', 'HITCOUNT': '0.200', 'WEAPON4': '0.400', 'FRAGCOUNT': '0.500', 'weapon2': '0.530', 'weapon4': '0.670', 'WEAPON3': '0.850', 'ARMOR': '0.971', 'DAMAGECOUNT': '1.017', 'weapon3': '2.040'} +[2023-09-14 14:53:19,956][63735] DAMAGECOUNT value on done: 7175.0 +[2023-09-14 14:53:19,957][63735] Sum rewards: -4.859, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.480', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'AMMO5': '0.008', 'weapon7': '0.068', 'WEAPON4': '0.100', 'weapon5': '0.108', 'weapon4': '0.112', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.136', 'HITCOUNT': '0.150', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.525', 'WEAPON3': '0.750', 'weapon2': '1.118', 'weapon3': '1.666'} +[2023-09-14 14:53:20,270][63733] Updated weights for policy 1, policy_version 1340 (0.0010) +[2023-09-14 14:53:20,299][63735] DAMAGECOUNT value on done: 7160.0 +[2023-09-14 14:53:20,299][63735] Sum rewards: -2.036, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.965', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'weapon4': '0.012', 'AMMO2': '0.012', 'weapon5': '0.024', 'ARMOR': '0.036', 'WEAPON4': '0.050', 'AMMO4': '0.061', 'AMMO3': '0.118', 'WEAPON5': '0.150', 'HITCOUNT': '0.250', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.762', 'weapon2': '1.648', 'weapon3': '1.888', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:53:20,615][63769] DAMAGECOUNT value on done: 6735.0 +[2023-09-14 14:53:20,616][63769] Sum rewards: -5.358, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-0.808', 'AMMO4': '-0.014', 'AMMO2': '-0.003', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'weapon7': '0.070', 'weapon5': '0.104', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.135', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.330', 'WEAPON3': '0.700', 'weapon2': '1.466', 'FRAGCOUNT': '1.500', 'weapon3': '1.592', 'DAMAGECOUNT': '1.650'} +[2023-09-14 14:53:21,008][63769] DAMAGECOUNT value on done: 7028.0 +[2023-09-14 14:53:21,008][63769] Sum rewards: -0.119, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO2': '0.031', 'WEAPON4': '0.100', 'AMMO3': '0.125', 'AMMO4': '0.154', 'HEALTH': '0.224', 'HITCOUNT': '0.240', 'weapon4': '0.404', 'ARMOR': '0.460', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.663', 'weapon2': '1.538', 'weapon3': '1.542', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:53:24,284][63767] DAMAGECOUNT value on done: 7642.0 +[2023-09-14 14:53:24,284][63767] Sum rewards: 0.887, reward structure: {'DEATHCOUNT': '-9.000', 'WEAPON1': '0.010', 'AMMO5': '0.017', 'AMMO2': '0.024', 'weapon5': '0.098', 'AMMO3': '0.104', 'AMMO4': '0.120', 'weapon4': '0.150', 'HEALTH': '0.156', 'WEAPON4': '0.250', 'HITCOUNT': '0.300', 'WEAPON5': '0.300', 'ARMOR': '0.412', 'WEAPON3': '0.550', 'DAMAGECOUNT': '1.215', 'weapon2': '1.516', 'weapon3': '1.664', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:53:24,426][63770] DAMAGECOUNT value on done: 8162.0 +[2023-09-14 14:53:24,426][63770] Sum rewards: 1.760, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.264', 'AMMO4': '-0.006', 'AMMO2': '-0.001', 'AMMO5': '0.015', 'ARMOR': '0.060', 'weapon5': '0.080', 'AMMO3': '0.139', 'WEAPON5': '0.300', 'HITCOUNT': '0.320', 'WEAPON3': '0.800', 'weapon2': '1.472', 'DAMAGECOUNT': '1.635', 'weapon3': '1.960', 'FRAGCOUNT': '6.000'} +[2023-09-14 14:53:24,614][63732] Updated weights for policy 0, policy_version 1400 (0.0011) +[2023-09-14 14:53:24,625][63767] DAMAGECOUNT value on done: 7135.0 +[2023-09-14 14:53:24,904][63770] DAMAGECOUNT value on done: 5259.0 +[2023-09-14 14:53:24,905][63770] Sum rewards: 1.179, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.718', 'AMMO2': '0.011', 'AMMO4': '0.053', 'ARMOR': '0.064', 'AMMO3': '0.125', 'WEAPON4': '0.200', 'weapon4': '0.220', 'HITCOUNT': '0.470', 'WEAPON3': '0.850', 'weapon2': '1.368', 'weapon3': '1.890', 'DAMAGECOUNT': '1.896', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:53:27,436][63805] DAMAGECOUNT value on done: 8927.0 +[2023-09-14 14:53:27,454][63771] DAMAGECOUNT value on done: 4363.0 +[2023-09-14 14:53:27,455][63771] Sum rewards: 0.428, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.462', 'AMMO2': '0.004', 'AMMO5': '0.008', 'AMMO4': '0.022', 'WEAPON4': '0.050', 'AMMO3': '0.075', 'weapon5': '0.076', 'weapon4': '0.186', 'HITCOUNT': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.450', 'ARMOR': '0.507', 'DAMAGECOUNT': '0.645', 'weapon3': '1.586', 'weapon2': '1.630', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:53:27,467][63576] Saving new best policy, reward=-3.447! +[2023-09-14 14:53:27,783][63733] Updated weights for policy 1, policy_version 1350 (0.0011) +[2023-09-14 14:53:27,809][63771] DAMAGECOUNT value on done: 6916.0 +[2023-09-14 14:53:27,810][63771] Sum rewards: -0.823, reward structure: {'DEATHCOUNT': '-9.000', 'AMMO2': '0.014', 'AMMO5': '0.017', 'WEAPON4': '0.050', 'ARMOR': '0.064', 'AMMO4': '0.069', 'AMMO3': '0.118', 'weapon5': '0.122', 'weapon4': '0.158', 'HITCOUNT': '0.240', 'HEALTH': '0.246', 'WEAPON5': '0.250', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.110', 'weapon2': '1.528', 'weapon3': '1.590', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:53:27,813][63805] DAMAGECOUNT value on done: 5495.0 +[2023-09-14 14:53:27,813][63805] Sum rewards: -0.665, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.120', 'AMMO2': '0.002', 'AMMO5': '0.010', 'AMMO4': '0.010', 'WEAPON1': '0.030', 'weapon4': '0.074', 'WEAPON4': '0.100', 'AMMO3': '0.121', 'weapon5': '0.146', 'WEAPON5': '0.150', 'HITCOUNT': '0.240', 'ARMOR': '0.445', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.050', 'weapon3': '1.676', 'weapon2': '1.700', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:53:28,083][63735] DAMAGECOUNT value on done: 7377.0 +[2023-09-14 14:53:28,283][63769] DAMAGECOUNT value on done: 7780.0 +[2023-09-14 14:53:28,283][63769] Sum rewards: -2.167, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.114', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.020', 'AMMO4': '0.099', 'WEAPON4': '0.100', 'AMMO3': '0.108', 'WEAPON5': '0.150', 'HITCOUNT': '0.160', 'weapon4': '0.162', 'weapon5': '0.234', 'ARMOR': '0.436', 'DAMAGECOUNT': '0.462', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.014', 'weapon2': '1.734'} +[2023-09-14 14:53:28,421][63735] DAMAGECOUNT value on done: 4613.0 +[2023-09-14 14:53:28,422][63735] Sum rewards: -1.641, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.740', 'AMMO5': '0.007', 'AMMO2': '0.020', 'WEAPON1': '0.030', 'ARMOR': '0.032', 'AMMO4': '0.098', 'AMMO3': '0.111', 'weapon5': '0.148', 'WEAPON5': '0.150', 'HITCOUNT': '0.200', 'weapon4': '0.238', 'WEAPON4': '0.250', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.705', 'FRAGCOUNT': '1.000', 'weapon2': '1.466', 'weapon3': '1.594'} +[2023-09-14 14:53:28,674][63769] DAMAGECOUNT value on done: 5760.0 +[2023-09-14 14:53:28,810][63806] DAMAGECOUNT value on done: 5027.0 +[2023-09-14 14:53:28,811][63806] Sum rewards: -3.113, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.011', 'AMMO5': '0.017', 'WEAPON1': '0.040', 'HITCOUNT': '0.040', 'AMMO4': '0.055', 'AMMO3': '0.067', 'DAMAGECOUNT': '0.090', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon7': '0.118', 'WEAPON5': '0.300', 'HEALTH': '0.332', 'weapon5': '0.342', 'WEAPON3': '0.400', 'weapon3': '0.912', 'weapon2': '1.112'} +[2023-09-14 14:53:29,150][63806] DAMAGECOUNT value on done: 8363.0 +[2023-09-14 14:53:29,150][63806] Sum rewards: 0.655, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.940', 'AMMO4': '-0.015', 'AMMO2': '-0.003', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'ARMOR': '0.040', 'AMMO3': '0.068', 'WEAPON4': '0.100', 'HITCOUNT': '0.170', 'weapon4': '0.216', 'WEAPON5': '0.300', 'weapon5': '0.358', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.567', 'FRAGCOUNT': '1.000', 'weapon2': '1.314', 'weapon3': '1.404'} +[2023-09-14 14:53:30,361][63734] DAMAGECOUNT value on done: 6742.0 +[2023-09-14 14:53:30,361][63734] Sum rewards: -2.257, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.040', 'AMMO5': '0.005', 'AMMO2': '0.019', 'ARMOR': '0.052', 'AMMO3': '0.080', 'weapon5': '0.084', 'AMMO4': '0.093', 'WEAPON5': '0.100', 'HITCOUNT': '0.210', 'weapon4': '0.238', 'WEAPON4': '0.300', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.498', 'FRAGCOUNT': '1.000', 'weapon3': '1.342', 'weapon2': '1.862'} +[2023-09-14 14:53:30,760][63734] DAMAGECOUNT value on done: 5459.0 +[2023-09-14 14:53:31,350][63732] Updated weights for policy 0, policy_version 1410 (0.0011) +[2023-09-14 14:53:31,740][63767] DAMAGECOUNT value on done: 8825.0 +[2023-09-14 14:53:32,142][63767] DAMAGECOUNT value on done: 8929.0 +[2023-09-14 14:53:32,142][63767] Sum rewards: -4.175, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.892', 'ARMOR': '0.005', 'AMMO2': '0.010', 'AMMO5': '0.015', 'AMMO4': '0.051', 'weapon5': '0.132', 'AMMO3': '0.166', 'HITCOUNT': '0.180', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.404', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.125', 'weapon3': '1.422', 'weapon2': '1.456', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:53:32,461][63576] Saving new best policy, reward=-3.310! +[2023-09-14 14:53:34,942][63805] DAMAGECOUNT value on done: 8547.0 +[2023-09-14 14:53:34,942][63805] Sum rewards: -4.295, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.480', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'ARMOR': '0.012', 'AMMO2': '0.018', 'HITCOUNT': '0.040', 'weapon5': '0.056', 'AMMO4': '0.087', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.105', 'AMMO3': '0.118', 'WEAPON5': '0.150', 'weapon4': '0.184', 'WEAPON3': '0.600', 'weapon3': '1.222', 'weapon2': '1.726'} +[2023-09-14 14:53:35,269][63805] DAMAGECOUNT value on done: 7820.0 +[2023-09-14 14:53:35,269][63805] Sum rewards: -1.522, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.790', 'weapon5': '0.014', 'AMMO5': '0.015', 'AMMO2': '0.023', 'ARMOR': '0.080', 'HITCOUNT': '0.110', 'AMMO4': '0.114', 'AMMO3': '0.131', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.285', 'WEAPON4': '0.300', 'weapon4': '0.590', 'WEAPON3': '0.700', 'weapon2': '0.972', 'FRAGCOUNT': '1.000', 'weapon3': '1.534'} +[2023-09-14 14:53:35,406][63733] Updated weights for policy 1, policy_version 1360 (0.0012) +[2023-09-14 14:53:35,913][63770] DAMAGECOUNT value on done: 6330.0 +[2023-09-14 14:53:35,913][63770] Sum rewards: -4.393, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.160', 'AMMO2': '0.002', 'AMMO5': '0.008', 'AMMO4': '0.010', 'ARMOR': '0.012', 'WEAPON1': '0.050', 'WEAPON4': '0.050', 'weapon5': '0.140', 'weapon4': '0.142', 'WEAPON5': '0.150', 'AMMO3': '0.184', 'HITCOUNT': '0.400', 'WEAPON3': '1.000', 'DAMAGECOUNT': '1.467', 'weapon2': '1.480', 'FRAGCOUNT': '1.500', 'weapon3': '1.672'} +[2023-09-14 14:53:36,322][63770] DAMAGECOUNT value on done: 6781.0 +[2023-09-14 14:53:38,050][63732] Updated weights for policy 0, policy_version 1420 (0.0010) +[2023-09-14 14:53:38,168][63771] DAMAGECOUNT value on done: 7983.0 +[2023-09-14 14:53:38,565][63771] DAMAGECOUNT value on done: 5326.0 +[2023-09-14 14:53:38,566][63771] Sum rewards: -4.817, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.180', 'AMMO2': '0.006', 'AMMO5': '0.008', 'WEAPON1': '0.020', 'AMMO4': '0.028', 'ARMOR': '0.036', 'AMMO3': '0.080', 'weapon5': '0.122', 'WEAPON4': '0.150', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'weapon4': '0.292', 'DAMAGECOUNT': '0.471', 'WEAPON3': '0.500', 'weapon3': '1.404', 'weapon2': '1.636'} +[2023-09-14 14:53:40,166][63734] DAMAGECOUNT value on done: 7641.0 +[2023-09-14 14:53:40,167][63734] Sum rewards: -3.837, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.970', 'AMMO2': '0.007', 'ARMOR': '0.008', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.035', 'weapon5': '0.044', 'AMMO3': '0.114', 'WEAPON5': '0.150', 'weapon4': '0.214', 'WEAPON4': '0.250', 'HITCOUNT': '0.280', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.846', 'weapon2': '1.548', 'weapon3': '1.604', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:53:40,514][63734] DAMAGECOUNT value on done: 6625.0 +[2023-09-14 14:53:40,515][63734] Sum rewards: -3.042, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.496', 'AMMO2': '0.002', 'AMMO5': '0.003', 'AMMO4': '0.007', 'weapon5': '0.040', 'WEAPON5': '0.050', 'AMMO3': '0.114', 'HITCOUNT': '0.220', 'ARMOR': '0.416', 'DAMAGECOUNT': '0.768', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.286', 'weapon3': '1.998'} +[2023-09-14 14:53:40,542][63806] DAMAGECOUNT value on done: 7442.0 +[2023-09-14 14:53:40,542][63806] Sum rewards: 0.809, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.415', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'AMMO5': '0.010', 'AMMO3': '0.067', 'WEAPON4': '0.100', 'weapon5': '0.176', 'HITCOUNT': '0.190', 'WEAPON5': '0.250', 'weapon4': '0.254', 'ARMOR': '0.436', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.876', 'weapon3': '1.242', 'weapon2': '1.380', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:53:40,913][63806] DAMAGECOUNT value on done: 6725.0 +[2023-09-14 14:53:40,914][63806] Sum rewards: -6.061, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.494', 'AMMO5': '0.012', 'AMMO2': '0.016', 'AMMO4': '0.080', 'ARMOR': '0.100', 'HITCOUNT': '0.140', 'AMMO3': '0.145', 'WEAPON4': '0.150', 'weapon5': '0.180', 'WEAPON5': '0.250', 'weapon4': '0.294', 'DAMAGECOUNT': '0.387', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.800', 'weapon2': '1.160', 'weapon3': '1.468'} +[2023-09-14 14:53:42,784][63735] DAMAGECOUNT value on done: 7256.0 +[2023-09-14 14:53:42,785][63735] Sum rewards: -4.269, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.296', 'AMMO5': '0.012', 'AMMO2': '0.024', 'weapon5': '0.036', 'HITCOUNT': '0.100', 'AMMO4': '0.118', 'AMMO3': '0.142', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.243', 'WEAPON5': '0.250', 'weapon4': '0.292', 'ARMOR': '0.464', 'WEAPON3': '0.650', 'weapon3': '0.714', 'FRAGCOUNT': '1.000', 'weapon2': '1.832'} +[2023-09-14 14:53:42,936][63733] Updated weights for policy 1, policy_version 1370 (0.0010) +[2023-09-14 14:53:43,100][63735] DAMAGECOUNT value on done: 7205.0 +[2023-09-14 14:53:44,055][63769] DAMAGECOUNT value on done: 7170.0 +[2023-09-14 14:53:44,056][63769] Sum rewards: 1.978, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.490', 'AMMO2': '0.012', 'AMMO5': '0.013', 'AMMO4': '0.062', 'ARMOR': '0.080', 'AMMO3': '0.101', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'weapon4': '0.228', 'HITCOUNT': '0.360', 'WEAPON3': '0.700', 'weapon2': '1.254', 'DAMAGECOUNT': '1.305', 'weapon3': '1.552', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:53:44,411][63769] DAMAGECOUNT value on done: 7154.0 +[2023-09-14 14:53:44,411][63769] Sum rewards: -8.196, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.550', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.007', 'AMMO2': '0.030', 'ARMOR': '0.051', 'HITCOUNT': '0.100', 'weapon5': '0.116', 'AMMO3': '0.127', 'WEAPON5': '0.150', 'AMMO4': '0.152', 'weapon4': '0.294', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.378', 'WEAPON3': '0.800', 'weapon2': '1.154', 'weapon3': '1.694'} +[2023-09-14 14:53:44,696][63732] Updated weights for policy 0, policy_version 1430 (0.0011) +[2023-09-14 14:53:47,062][63767] DAMAGECOUNT value on done: 7844.0 +[2023-09-14 14:53:47,446][63767] DAMAGECOUNT value on done: 7205.0 +[2023-09-14 14:53:49,761][63770] DAMAGECOUNT value on done: 8367.0 +[2023-09-14 14:53:49,762][63770] Sum rewards: -5.902, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.002', 'AMMO2': '0.002', 'AMMO5': '0.003', 'AMMO4': '0.009', 'WEAPON5': '0.050', 'weapon5': '0.064', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'AMMO3': '0.189', 'weapon4': '0.198', 'DAMAGECOUNT': '0.615', 'WEAPON3': '0.900', 'weapon3': '1.244', 'weapon2': '1.776', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:53:49,980][63805] DAMAGECOUNT value on done: 9157.0 +[2023-09-14 14:53:49,981][63805] Sum rewards: 4.400, reward structure: {'DEATHCOUNT': '-2.250', 'AMMO4': '-0.014', 'AMMO2': '-0.003', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO3': '0.040', 'WEAPON5': '0.050', 'HEALTH': '0.120', 'WEAPON3': '0.200', 'HITCOUNT': '0.200', 'ARMOR': '0.458', 'DAMAGECOUNT': '0.690', 'weapon2': '0.850', 'weapon3': '1.046', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:53:50,161][63770] DAMAGECOUNT value on done: 5688.0 +[2023-09-14 14:53:50,161][63770] Sum rewards: 1.116, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.743', 'AMMO5': '0.005', 'AMMO2': '0.011', 'weapon5': '0.042', 'WEAPON1': '0.050', 'AMMO4': '0.055', 'WEAPON5': '0.100', 'AMMO3': '0.101', 'WEAPON4': '0.150', 'weapon4': '0.216', 'HITCOUNT': '0.380', 'WEAPON3': '0.600', 'weapon2': '1.224', 'DAMAGECOUNT': '1.287', 'weapon3': '1.888', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:53:50,290][63733] Updated weights for policy 1, policy_version 1380 (0.0011) +[2023-09-14 14:53:50,322][63735] DAMAGECOUNT value on done: 7532.0 +[2023-09-14 14:53:50,374][63805] DAMAGECOUNT value on done: 5885.0 +[2023-09-14 14:53:50,374][63805] Sum rewards: -2.421, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.042', 'AMMO2': '0.002', 'AMMO4': '0.009', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'weapon5': '0.028', 'WEAPON4': '0.100', 'AMMO3': '0.117', 'weapon4': '0.236', 'WEAPON5': '0.250', 'HITCOUNT': '0.310', 'ARMOR': '0.432', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.170', 'weapon2': '1.460', 'weapon3': '1.720', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:53:50,512][63771] DAMAGECOUNT value on done: 4728.0 +[2023-09-14 14:53:50,513][63771] Sum rewards: 0.831, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.907', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.023', 'ARMOR': '0.040', 'AMMO3': '0.076', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.116', 'weapon5': '0.138', 'weapon4': '0.158', 'HITCOUNT': '0.260', 'WEAPON3': '0.450', 'DAMAGECOUNT': '1.095', 'weapon3': '1.390', 'FRAGCOUNT': '1.500', 'weapon2': '1.528'} +[2023-09-14 14:53:50,628][63735] DAMAGECOUNT value on done: 4813.0 +[2023-09-14 14:53:50,628][63735] Sum rewards: -0.656, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.395', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO2': '0.024', 'weapon5': '0.078', 'AMMO3': '0.098', 'AMMO4': '0.118', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'weapon4': '0.214', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.600', 'weapon2': '1.210', 'weapon3': '1.870', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:53:50,921][63771] DAMAGECOUNT value on done: 7206.0 +[2023-09-14 14:53:50,922][63771] Sum rewards: -1.328, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.058', 'weapon5': '0.008', 'AMMO2': '0.011', 'AMMO5': '0.015', 'ARMOR': '0.036', 'AMMO4': '0.056', 'AMMO3': '0.078', 'weapon7': '0.102', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.240', 'WEAPON4': '0.250', 'weapon4': '0.306', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.870', 'FRAGCOUNT': '1.000', 'weapon3': '1.036', 'weapon2': '1.382'} +[2023-09-14 14:53:51,252][63769] DAMAGECOUNT value on done: 7991.0 +[2023-09-14 14:53:51,253][63769] Sum rewards: -2.830, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.742', 'AMMO2': '0.002', 'ARMOR': '0.004', 'AMMO4': '0.009', 'AMMO3': '0.102', 'HITCOUNT': '0.130', 'WEAPON4': '0.150', 'weapon4': '0.196', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.633', 'weapon3': '1.432', 'weapon2': '1.954', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:53:51,439][63732] Updated weights for policy 0, policy_version 1440 (0.0011) +[2023-09-14 14:53:51,459][63806] DAMAGECOUNT value on done: 5402.0 +[2023-09-14 14:53:51,459][63806] Sum rewards: 0.199, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.324', 'AMMO2': '0.004', 'weapon5': '0.012', 'AMMO5': '0.015', 'AMMO4': '0.020', 'WEAPON1': '0.040', 'WEAPON4': '0.100', 'AMMO3': '0.139', 'weapon4': '0.148', 'WEAPON5': '0.300', 'HITCOUNT': '0.330', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.125', 'weapon2': '1.334', 'weapon3': '1.806', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:53:51,588][63769] DAMAGECOUNT value on done: 5956.0 +[2023-09-14 14:53:51,589][63769] Sum rewards: 1.154, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.772', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO2': '0.031', 'AMMO3': '0.092', 'HITCOUNT': '0.150', 'AMMO4': '0.154', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'weapon4': '0.296', 'weapon5': '0.372', 'DAMAGECOUNT': '0.588', 'WEAPON3': '0.650', 'ARMOR': '0.988', 'weapon2': '1.072', 'weapon3': '1.798', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:53:51,777][63806] DAMAGECOUNT value on done: 8463.0 +[2023-09-14 14:53:52,461][63576] Saving new best policy, reward=-3.056! +[2023-09-14 14:53:54,811][63767] DAMAGECOUNT value on done: 9060.0 +[2023-09-14 14:53:54,812][63767] Sum rewards: -2.013, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.216', 'AMMO5': '0.007', 'AMMO2': '0.015', 'WEAPON1': '0.020', 'weapon5': '0.048', 'AMMO4': '0.075', 'ARMOR': '0.104', 'AMMO3': '0.108', 'WEAPON5': '0.150', 'HITCOUNT': '0.220', 'WEAPON4': '0.300', 'weapon4': '0.560', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.705', 'FRAGCOUNT': '1.000', 'weapon2': '1.138', 'weapon3': '1.402'} +[2023-09-14 14:53:55,189][63767] DAMAGECOUNT value on done: 9138.0 +[2023-09-14 14:53:55,189][63767] Sum rewards: -7.100, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.426', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'weapon5': '0.006', 'AMMO2': '0.031', 'ARMOR': '0.040', 'WEAPON5': '0.100', 'AMMO3': '0.118', 'AMMO4': '0.153', 'HITCOUNT': '0.200', 'WEAPON4': '0.400', 'weapon4': '0.528', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.627', 'weapon3': '1.116', 'weapon2': '1.402'} +[2023-09-14 14:53:55,503][63734] DAMAGECOUNT value on done: 7171.0 +[2023-09-14 14:53:55,503][63734] Sum rewards: 2.022, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.632', 'AMMO4': '-0.003', 'AMMO2': '-0.000', 'AMMO5': '0.003', 'AMMO3': '0.099', 'WEAPON5': '0.100', 'weapon5': '0.142', 'WEAPON4': '0.150', 'HITCOUNT': '0.210', 'weapon4': '0.398', 'ARMOR': '0.452', 'WEAPON3': '0.500', 'weapon3': '1.206', 'DAMAGECOUNT': '1.287', 'weapon2': '1.610', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:53:55,910][63734] DAMAGECOUNT value on done: 5680.0 +[2023-09-14 14:53:55,911][63734] Sum rewards: -3.830, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.392', 'AMMO5': '0.007', 'AMMO2': '0.013', 'weapon5': '0.048', 'WEAPON1': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.062', 'weapon4': '0.102', 'AMMO3': '0.124', 'WEAPON5': '0.150', 'HITCOUNT': '0.180', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.663', 'ARMOR': '0.884', 'FRAGCOUNT': '1.000', 'weapon3': '1.424', 'weapon2': '1.654'} +[2023-09-14 14:53:57,864][63805] DAMAGECOUNT value on done: 8597.0 +[2023-09-14 14:53:58,037][63733] Updated weights for policy 1, policy_version 1390 (0.0011) +[2023-09-14 14:53:58,160][63732] Updated weights for policy 0, policy_version 1450 (0.0011) +[2023-09-14 14:53:58,244][63805] DAMAGECOUNT value on done: 8286.0 +[2023-09-14 14:53:58,245][63805] Sum rewards: -0.269, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.424', 'AMMO5': '0.005', 'AMMO2': '0.017', 'WEAPON5': '0.050', 'ARMOR': '0.068', 'AMMO4': '0.085', 'AMMO3': '0.099', 'weapon5': '0.118', 'WEAPON4': '0.200', 'HITCOUNT': '0.250', 'weapon4': '0.264', 'WEAPON3': '0.650', 'weapon2': '1.018', 'DAMAGECOUNT': '1.398', 'weapon3': '1.682', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:54:01,210][63771] DAMAGECOUNT value on done: 8278.0 +[2023-09-14 14:54:01,210][63771] Sum rewards: -2.753, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.166', 'AMMO5': '0.007', 'WEAPON1': '0.030', 'ARMOR': '0.032', 'AMMO2': '0.034', 'weapon4': '0.084', 'AMMO3': '0.137', 'WEAPON5': '0.150', 'AMMO4': '0.169', 'HITCOUNT': '0.200', 'weapon5': '0.206', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.885', 'weapon2': '0.898', 'WEAPON3': '0.900', 'FRAGCOUNT': '2.000', 'weapon3': '2.180'} +[2023-09-14 14:54:01,325][63770] DAMAGECOUNT value on done: 6390.0 +[2023-09-14 14:54:01,326][63770] Sum rewards: -3.123, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.542', 'AMMO2': '0.010', 'AMMO5': '0.010', 'weapon5': '0.022', 'AMMO4': '0.049', 'HITCOUNT': '0.050', 'ARMOR': '0.068', 'AMMO3': '0.114', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.180', 'WEAPON4': '0.250', 'weapon4': '0.394', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.278', 'weapon3': '1.594'} +[2023-09-14 14:54:01,550][63771] DAMAGECOUNT value on done: 5536.0 +[2023-09-14 14:54:01,550][63771] Sum rewards: -3.346, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.256', 'AMMO5': '0.007', 'weapon5': '0.018', 'AMMO2': '0.035', 'WEAPON1': '0.060', 'AMMO3': '0.126', 'WEAPON5': '0.150', 'HITCOUNT': '0.160', 'AMMO4': '0.177', 'weapon4': '0.276', 'WEAPON4': '0.400', 'ARMOR': '0.419', 'DAMAGECOUNT': '0.630', 'WEAPON3': '0.750', 'weapon2': '1.498', 'weapon3': '1.702', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:54:01,770][63770] DAMAGECOUNT value on done: 7061.0 +[2023-09-14 14:54:01,771][63770] Sum rewards: 0.121, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-1.390', 'AMMO2': '0.003', 'AMMO5': '0.010', 'AMMO4': '0.012', 'weapon5': '0.070', 'AMMO3': '0.078', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'weapon4': '0.206', 'HITCOUNT': '0.210', 'ARMOR': '0.500', 'WEAPON3': '0.550', 'weapon2': '0.724', 'DAMAGECOUNT': '0.840', 'FRAGCOUNT': '1.000', 'weapon3': '1.508'} +[2023-09-14 14:54:03,055][63806] DAMAGECOUNT value on done: 7712.0 +[2023-09-14 14:54:03,055][63806] Sum rewards: -5.423, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.916', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.010', 'ARMOR': '0.017', 'AMMO2': '0.020', 'WEAPON1': '0.020', 'AMMO4': '0.099', 'WEAPON5': '0.150', 'AMMO3': '0.153', 'HITCOUNT': '0.180', 'weapon5': '0.186', 'WEAPON4': '0.300', 'weapon4': '0.368', 'DAMAGECOUNT': '0.810', 'WEAPON3': '0.950', 'weapon2': '1.184', 'weapon3': '1.546'} +[2023-09-14 14:54:03,373][63806] DAMAGECOUNT value on done: 7130.0 +[2023-09-14 14:54:03,373][63806] Sum rewards: -1.011, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.790', 'AMMO2': '0.012', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'ARMOR': '0.040', 'AMMO4': '0.059', 'AMMO3': '0.105', 'weapon5': '0.118', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'HITCOUNT': '0.260', 'weapon4': '0.274', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.650', 'weapon2': '1.154', 'DAMAGECOUNT': '1.215', 'weapon3': '1.710'} +[2023-09-14 14:54:03,746][63734] DAMAGECOUNT value on done: 8004.0 +[2023-09-14 14:54:03,747][63734] Sum rewards: -5.254, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.700', 'AMMO5': '0.009', 'ARMOR': '0.012', 'AMMO2': '0.014', 'WEAPON1': '0.020', 'weapon7': '0.040', 'weapon5': '0.068', 'AMMO4': '0.068', 'AMMO6': '0.160', 'AMMO7': '0.160', 'AMMO3': '0.170', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.240', 'WEAPON4': '0.250', 'weapon4': '0.338', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.089', 'weapon3': '1.336', 'weapon2': '1.472'} +[2023-09-14 14:54:04,143][63734] DAMAGECOUNT value on done: 7247.0 +[2023-09-14 14:54:04,144][63734] Sum rewards: 0.334, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.188', 'AMMO2': '0.010', 'AMMO5': '0.022', 'WEAPON4': '0.050', 'ARMOR': '0.052', 'AMMO4': '0.052', 'weapon4': '0.068', 'AMMO3': '0.126', 'WEAPON5': '0.200', 'HITCOUNT': '0.340', 'weapon5': '0.398', 'WEAPON3': '0.600', 'weapon3': '1.426', 'weapon2': '1.560', 'DAMAGECOUNT': '1.866', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:54:04,844][63732] Updated weights for policy 0, policy_version 1460 (0.0010) +[2023-09-14 14:54:05,119][63735] DAMAGECOUNT value on done: 7579.0 +[2023-09-14 14:54:05,119][63735] Sum rewards: 1.333, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.636', 'AMMO4': '-0.008', 'AMMO2': '-0.001', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'ARMOR': '0.048', 'weapon5': '0.050', 'AMMO3': '0.106', 'WEAPON4': '0.150', 'HITCOUNT': '0.290', 'weapon4': '0.316', 'WEAPON5': '0.350', 'WEAPON3': '0.750', 'weapon2': '0.808', 'DAMAGECOUNT': '0.969', 'weapon3': '2.104', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:54:05,452][63735] DAMAGECOUNT value on done: 7559.0 +[2023-09-14 14:54:05,453][63735] Sum rewards: -0.978, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.210', 'AMMO2': '0.000', 'AMMO4': '0.000', 'AMMO5': '0.013', 'weapon7': '0.018', 'AMMO3': '0.091', 'weapon5': '0.170', 'WEAPON4': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.240', 'WEAPON5': '0.250', 'weapon4': '0.360', 'WEAPON3': '0.700', 'ARMOR': '0.997', 'DAMAGECOUNT': '1.062', 'weapon2': '1.274', 'weapon3': '1.506', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:54:05,458][63733] Updated weights for policy 1, policy_version 1400 (0.0011) +[2023-09-14 14:54:07,281][63769] DAMAGECOUNT value on done: 7568.0 +[2023-09-14 14:54:07,282][63769] Sum rewards: 4.148, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.115', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.021', 'weapon5': '0.056', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.103', 'AMMO3': '0.108', 'weapon7': '0.154', 'WEAPON4': '0.250', 'HITCOUNT': '0.290', 'ARMOR': '0.476', 'weapon4': '0.530', 'WEAPON3': '0.600', 'weapon2': '1.170', 'DAMAGECOUNT': '1.194', 'weapon3': '1.396', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:54:07,684][63769] DAMAGECOUNT value on done: 7229.0 +[2023-09-14 14:54:07,684][63769] Sum rewards: -3.545, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.936', 'AMMO2': '0.016', 'AMMO5': '0.022', 'HITCOUNT': '0.070', 'AMMO4': '0.081', 'AMMO3': '0.120', 'weapon5': '0.150', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.225', 'WEAPON5': '0.300', 'ARMOR': '0.400', 'weapon4': '0.414', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.166', 'weapon2': '1.476'} +[2023-09-14 14:54:10,153][63767] DAMAGECOUNT value on done: 8436.0 +[2023-09-14 14:54:10,153][63767] Sum rewards: -0.186, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.143', 'AMMO4': '-0.018', 'AMMO2': '-0.003', 'ARMOR': '0.072', 'AMMO3': '0.192', 'HITCOUNT': '0.490', 'WEAPON3': '1.000', 'weapon2': '1.590', 'weapon3': '1.608', 'DAMAGECOUNT': '1.776', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:54:10,503][63767] DAMAGECOUNT value on done: 7410.0 +[2023-09-14 14:54:11,690][63732] Updated weights for policy 0, policy_version 1470 (0.0011) +[2023-09-14 14:54:12,461][63576] Saving new best policy, reward=-3.046! +[2023-09-14 14:54:12,740][63735] DAMAGECOUNT value on done: 7827.0 +[2023-09-14 14:54:12,741][63735] Sum rewards: -1.743, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.264', 'AMMO5': '0.015', 'AMMO2': '0.016', 'weapon4': '0.058', 'AMMO4': '0.081', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.130', 'HITCOUNT': '0.210', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.885', 'weapon3': '1.692', 'weapon2': '1.934', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:54:12,892][63805] DAMAGECOUNT value on done: 9562.0 +[2023-09-14 14:54:12,893][63805] Sum rewards: -0.313, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.112', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.015', 'ARMOR': '0.052', 'AMMO4': '0.075', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.110', 'weapon5': '0.132', 'weapon4': '0.210', 'HITCOUNT': '0.230', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.215', 'weapon2': '1.228', 'weapon3': '1.716', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:54:13,088][63735] DAMAGECOUNT value on done: 5113.0 +[2023-09-14 14:54:13,088][63735] Sum rewards: -2.378, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.049', 'ARMOR': '0.008', 'AMMO5': '0.015', 'AMMO2': '0.016', 'WEAPON1': '0.040', 'AMMO4': '0.081', 'AMMO3': '0.144', 'weapon5': '0.150', 'WEAPON4': '0.200', 'weapon4': '0.202', 'HITCOUNT': '0.270', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.900', 'weapon2': '0.936', 'WEAPON3': '0.950', 'FRAGCOUNT': '2.000', 'weapon3': '2.208'} +[2023-09-14 14:54:13,182][63733] Updated weights for policy 1, policy_version 1410 (0.0012) +[2023-09-14 14:54:13,296][63805] DAMAGECOUNT value on done: 6285.0 +[2023-09-14 14:54:13,297][63805] Sum rewards: -4.553, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.512', 'weapon5': '0.004', 'AMMO5': '0.013', 'AMMO2': '0.021', 'WEAPON1': '0.080', 'AMMO4': '0.105', 'AMMO3': '0.114', 'WEAPON5': '0.250', 'HITCOUNT': '0.270', 'WEAPON4': '0.300', 'ARMOR': '0.436', 'WEAPON3': '0.700', 'weapon4': '0.722', 'DAMAGECOUNT': '1.200', 'weapon3': '1.222', 'weapon2': '1.272', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:54:13,772][63806] DAMAGECOUNT value on done: 5694.0 +[2023-09-14 14:54:13,772][63806] Sum rewards: -2.164, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.613', 'WEAPON1': '0.010', 'AMMO2': '0.016', 'AMMO5': '0.018', 'ARMOR': '0.052', 'AMMO4': '0.081', 'AMMO3': '0.108', 'weapon5': '0.146', 'WEAPON4': '0.200', 'HITCOUNT': '0.200', 'WEAPON5': '0.300', 'weapon4': '0.340', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.876', 'FRAGCOUNT': '1.000', 'weapon2': '1.040', 'weapon3': '1.712'} +[2023-09-14 14:54:13,969][63771] DAMAGECOUNT value on done: 5058.0 +[2023-09-14 14:54:13,969][63771] Sum rewards: -3.800, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.798', 'AMMO2': '0.000', 'AMMO4': '0.001', 'weapon7': '0.002', 'AMMO5': '0.012', 'weapon5': '0.018', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.150', 'WEAPON5': '0.250', 'HITCOUNT': '0.260', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.990', 'weapon2': '1.526', 'weapon3': '1.888', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:54:14,174][63806] DAMAGECOUNT value on done: 8628.0 +[2023-09-14 14:54:14,175][63806] Sum rewards: -6.068, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.910', 'AMMO2': '0.003', 'AMMO4': '0.013', 'AMMO5': '0.015', 'ARMOR': '0.032', 'AMMO3': '0.110', 'HITCOUNT': '0.110', 'weapon5': '0.200', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.388', 'weapon3': '1.926'} +[2023-09-14 14:54:14,338][63771] DAMAGECOUNT value on done: 7356.0 +[2023-09-14 14:54:14,339][63771] Sum rewards: -4.200, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.630', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.010', 'AMMO2': '0.016', 'ARMOR': '0.032', 'AMMO4': '0.080', 'weapon5': '0.082', 'AMMO3': '0.146', 'HITCOUNT': '0.150', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon4': '0.412', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.750', 'weapon3': '1.338', 'weapon2': '1.464'} +[2023-09-14 14:54:14,374][63769] DAMAGECOUNT value on done: 8369.0 +[2023-09-14 14:54:14,374][63769] Sum rewards: -0.367, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.000', 'WEAPON1': '0.010', 'AMMO2': '0.012', 'AMMO5': '0.012', 'AMMO4': '0.058', 'weapon7': '0.076', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.130', 'WEAPON4': '0.150', 'WEAPON7': '0.200', 'WEAPON5': '0.250', 'HITCOUNT': '0.330', 'weapon4': '0.362', 'ARMOR': '0.449', 'WEAPON3': '0.800', 'weapon2': '1.110', 'DAMAGECOUNT': '1.134', 'weapon3': '1.810', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:54:14,790][63769] DAMAGECOUNT value on done: 6191.0 +[2023-09-14 14:54:14,790][63769] Sum rewards: -5.911, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.882', 'AMMO2': '0.004', 'AMMO5': '0.010', 'AMMO4': '0.017', 'WEAPON1': '0.020', 'weapon5': '0.028', 'AMMO3': '0.120', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'HITCOUNT': '0.210', 'weapon4': '0.264', 'ARMOR': '0.521', 'DAMAGECOUNT': '0.705', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.468', 'weapon3': '1.654'} +[2023-09-14 14:54:15,224][63770] DAMAGECOUNT value on done: 8755.0 +[2023-09-14 14:54:15,225][63770] Sum rewards: 2.619, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.830', 'AMMO2': '0.011', 'AMMO4': '0.055', 'ARMOR': '0.090', 'AMMO3': '0.106', 'WEAPON4': '0.250', 'HITCOUNT': '0.280', 'weapon4': '0.530', 'WEAPON3': '0.650', 'weapon2': '0.662', 'DAMAGECOUNT': '1.164', 'weapon3': '1.900', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:54:15,651][63770] DAMAGECOUNT value on done: 6048.0 +[2023-09-14 14:54:15,651][63770] Sum rewards: -0.538, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.906', 'AMMO2': '0.011', 'AMMO5': '0.018', 'WEAPON1': '0.040', 'weapon5': '0.046', 'AMMO4': '0.052', 'AMMO3': '0.091', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'HITCOUNT': '0.230', 'weapon4': '0.318', 'WEAPON3': '0.650', 'weapon2': '0.962', 'DAMAGECOUNT': '1.080', 'weapon3': '1.770', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:54:17,467][63576] Saving new best policy, reward=-2.917! +[2023-09-14 14:54:18,393][63767] DAMAGECOUNT value on done: 9275.0 +[2023-09-14 14:54:18,393][63767] Sum rewards: -2.343, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.718', 'AMMO5': '0.008', 'WEAPON1': '0.010', 'weapon5': '0.032', 'AMMO2': '0.035', 'ARMOR': '0.092', 'weapon4': '0.104', 'AMMO3': '0.112', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'AMMO4': '0.175', 'WEAPON4': '0.300', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.645', 'weapon2': '1.286', 'weapon3': '1.706'} +[2023-09-14 14:54:18,582][63732] Updated weights for policy 0, policy_version 1480 (0.0010) +[2023-09-14 14:54:18,774][63767] DAMAGECOUNT value on done: 9306.0 +[2023-09-14 14:54:18,775][63767] Sum rewards: -2.750, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.486', 'AMMO5': '0.008', 'AMMO2': '0.012', 'AMMO4': '0.060', 'ARMOR': '0.068', 'AMMO3': '0.103', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'weapon5': '0.194', 'weapon4': '0.380', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.504', 'FRAGCOUNT': '1.000', 'weapon3': '1.240', 'weapon2': '1.476'} +[2023-09-14 14:54:20,777][63733] Updated weights for policy 1, policy_version 1420 (0.0011) +[2023-09-14 14:54:21,084][63734] DAMAGECOUNT value on done: 7440.0 +[2023-09-14 14:54:21,084][63734] Sum rewards: -5.615, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.840', 'AMMO5': '0.010', 'AMMO2': '0.035', 'weapon5': '0.050', 'ARMOR': '0.072', 'AMMO3': '0.137', 'WEAPON5': '0.150', 'AMMO4': '0.174', 'HITCOUNT': '0.200', 'WEAPON4': '0.350', 'weapon4': '0.496', 'DAMAGECOUNT': '0.807', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.142', 'weapon3': '1.252'} +[2023-09-14 14:54:21,156][63805] DAMAGECOUNT value on done: 8760.0 +[2023-09-14 14:54:21,156][63805] Sum rewards: -3.665, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.482', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.008', 'weapon5': '0.050', 'WEAPON4': '0.100', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'weapon4': '0.154', 'AMMO3': '0.164', 'DAMAGECOUNT': '0.489', 'weapon2': '0.996', 'WEAPON3': '1.000', 'weapon3': '2.052', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:54:21,547][63734] DAMAGECOUNT value on done: 5904.0 +[2023-09-14 14:54:21,548][63734] Sum rewards: -4.988, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.704', 'ARMOR': '0.008', 'AMMO2': '0.028', 'AMMO3': '0.123', 'AMMO4': '0.139', 'HITCOUNT': '0.180', 'WEAPON4': '0.250', 'weapon4': '0.374', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.672', 'FRAGCOUNT': '1.000', 'weapon3': '1.360', 'weapon2': '1.432'} +[2023-09-14 14:54:21,560][63805] DAMAGECOUNT value on done: 8641.0 +[2023-09-14 14:54:24,370][63771] DAMAGECOUNT value on done: 8783.0 +[2023-09-14 14:54:24,371][63771] Sum rewards: -1.387, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.533', 'WEAPON1': '0.010', 'AMMO2': '0.014', 'AMMO5': '0.018', 'weapon5': '0.020', 'ARMOR': '0.036', 'AMMO4': '0.071', 'AMMO3': '0.138', 'WEAPON4': '0.150', 'weapon4': '0.270', 'WEAPON5': '0.350', 'HITCOUNT': '0.360', 'WEAPON3': '0.700', 'weapon2': '1.372', 'weapon3': '1.372', 'DAMAGECOUNT': '1.515', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:54:24,777][63771] DAMAGECOUNT value on done: 5977.0 +[2023-09-14 14:54:24,777][63771] Sum rewards: -3.170, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.046', 'weapon5': '0.008', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.010', 'AMMO4': '0.051', 'ARMOR': '0.060', 'AMMO3': '0.169', 'WEAPON5': '0.200', 'HITCOUNT': '0.340', 'WEAPON3': '0.950', 'weapon2': '1.216', 'DAMAGECOUNT': '1.323', 'weapon3': '2.028', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:54:25,337][63732] Updated weights for policy 0, policy_version 1490 (0.0010) +[2023-09-14 14:54:26,077][63806] DAMAGECOUNT value on done: 7966.0 +[2023-09-14 14:54:26,078][63806] Sum rewards: -2.565, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.965', 'AMMO2': '0.037', 'AMMO3': '0.112', 'ARMOR': '0.112', 'AMMO4': '0.183', 'HITCOUNT': '0.200', 'weapon4': '0.334', 'WEAPON4': '0.350', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.762', 'FRAGCOUNT': '1.000', 'weapon2': '1.092', 'weapon3': '1.768'} +[2023-09-14 14:54:26,417][63806] DAMAGECOUNT value on done: 7300.0 +[2023-09-14 14:54:26,418][63806] Sum rewards: -3.575, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.224', 'AMMO5': '0.003', 'weapon5': '0.016', 'AMMO2': '0.030', 'WEAPON5': '0.050', 'ARMOR': '0.060', 'AMMO3': '0.068', 'HITCOUNT': '0.120', 'AMMO4': '0.152', 'WEAPON3': '0.250', 'WEAPON4': '0.450', 'DAMAGECOUNT': '0.510', 'weapon4': '0.640', 'weapon3': '0.838', 'FRAGCOUNT': '1.000', 'weapon2': '1.712'} +[2023-09-14 14:54:26,752][63770] DAMAGECOUNT value on done: 6799.0 +[2023-09-14 14:54:26,753][63770] Sum rewards: -3.486, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.135', 'weapon7': '0.010', 'AMMO2': '0.010', 'AMMO5': '0.023', 'weapon4': '0.026', 'AMMO4': '0.052', 'WEAPON4': '0.100', 'AMMO3': '0.177', 'weapon5': '0.186', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.350', 'WEAPON5': '0.450', 'WEAPON3': '1.000', 'DAMAGECOUNT': '1.227', 'weapon3': '1.498', 'weapon2': '1.690', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:54:27,140][63770] DAMAGECOUNT value on done: 7146.0 +[2023-09-14 14:54:27,140][63770] Sum rewards: -7.135, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.966', 'AMMO2': '0.002', 'WEAPON1': '0.010', 'AMMO4': '0.010', 'AMMO5': '0.015', 'ARMOR': '0.032', 'weapon5': '0.060', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'AMMO3': '0.106', 'weapon4': '0.112', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.255', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.128', 'weapon2': '1.560'} +[2023-09-14 14:54:27,467][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001428_5849088.pth... +[2023-09-14 14:54:27,469][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001493_6115328.pth... +[2023-09-14 14:54:27,526][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001132_4636672.pth +[2023-09-14 14:54:27,527][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001135_4648960.pth +[2023-09-14 14:54:27,702][63734] DAMAGECOUNT value on done: 8189.0 +[2023-09-14 14:54:27,702][63734] Sum rewards: -1.994, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.598', 'AMMO5': '0.005', 'AMMO2': '0.007', 'ARMOR': '0.028', 'AMMO4': '0.037', 'weapon7': '0.076', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.106', 'HITCOUNT': '0.120', 'weapon4': '0.184', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.555', 'WEAPON3': '0.650', 'weapon3': '1.314', 'weapon2': '1.422', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:54:28,074][63735] DAMAGECOUNT value on done: 7719.0 +[2023-09-14 14:54:28,092][63734] DAMAGECOUNT value on done: 7404.0 +[2023-09-14 14:54:28,093][63734] Sum rewards: -2.082, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.507', 'weapon7': '0.002', 'AMMO5': '0.012', 'AMMO2': '0.013', 'ARMOR': '0.032', 'AMMO4': '0.065', 'weapon5': '0.106', 'AMMO3': '0.133', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'WEAPON4': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon4': '0.320', 'DAMAGECOUNT': '0.471', 'WEAPON3': '0.750', 'weapon2': '0.838', 'FRAGCOUNT': '1.000', 'weapon3': '1.812'} +[2023-09-14 14:54:28,352][63733] Updated weights for policy 1, policy_version 1430 (0.0010) +[2023-09-14 14:54:28,416][63735] DAMAGECOUNT value on done: 7824.0 +[2023-09-14 14:54:28,416][63735] Sum rewards: -2.896, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.182', 'AMMO4': '-0.044', 'AMMO2': '-0.009', 'AMMO5': '0.010', 'WEAPON4': '0.100', 'AMMO3': '0.101', 'HITCOUNT': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.228', 'ARMOR': '0.535', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.795', 'FRAGCOUNT': '1.000', 'weapon3': '1.412', 'weapon2': '1.508'} +[2023-09-14 14:54:30,860][63769] DAMAGECOUNT value on done: 7703.0 +[2023-09-14 14:54:30,861][63769] Sum rewards: -6.887, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.075', 'AMMO5': '0.017', 'AMMO2': '0.020', 'weapon5': '0.046', 'AMMO4': '0.097', 'HITCOUNT': '0.110', 'AMMO3': '0.137', 'WEAPON5': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.800', 'weapon2': '1.368', 'weapon3': '1.652'} +[2023-09-14 14:54:31,211][63769] DAMAGECOUNT value on done: 7393.0 +[2023-09-14 14:54:31,212][63769] Sum rewards: -4.140, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.255', 'AMMO4': '-0.016', 'AMMO2': '-0.003', 'AMMO5': '0.008', 'ARMOR': '0.036', 'AMMO3': '0.134', 'HITCOUNT': '0.140', 'weapon5': '0.246', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.492', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.192', 'weapon3': '1.786'} +[2023-09-14 14:54:32,099][63732] Updated weights for policy 0, policy_version 1500 (0.0011) +[2023-09-14 14:54:33,203][63767] DAMAGECOUNT value on done: 8725.0 +[2023-09-14 14:54:33,203][63767] Sum rewards: -2.800, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.530', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.015', 'AMMO4': '0.075', 'AMMO3': '0.137', 'weapon5': '0.194', 'WEAPON5': '0.200', 'HITCOUNT': '0.240', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.867', 'FRAGCOUNT': '1.000', 'weapon2': '1.282', 'weapon3': '2.000'} +[2023-09-14 14:54:33,537][63767] DAMAGECOUNT value on done: 7597.0 +[2023-09-14 14:54:33,538][63767] Sum rewards: -5.962, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.360', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO2': '0.014', 'weapon5': '0.056', 'AMMO4': '0.067', 'AMMO3': '0.128', 'HITCOUNT': '0.160', 'WEAPON5': '0.250', 'WEAPON4': '0.350', 'weapon4': '0.440', 'DAMAGECOUNT': '0.561', 'WEAPON3': '0.650', 'weapon2': '1.338', 'weapon3': '1.362', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:54:35,196][63735] DAMAGECOUNT value on done: 7972.0 +[2023-09-14 14:54:35,197][63735] Sum rewards: -2.193, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.332', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'AMMO4': '0.021', 'ARMOR': '0.060', 'AMMO3': '0.091', 'HITCOUNT': '0.100', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.435', 'weapon4': '0.502', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.218', 'weapon3': '1.498'} +[2023-09-14 14:54:35,555][63735] DAMAGECOUNT value on done: 5481.0 +[2023-09-14 14:54:35,556][63735] Sum rewards: 1.275, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.672', 'AMMO5': '0.003', 'AMMO2': '0.017', 'WEAPON1': '0.020', 'ARMOR': '0.048', 'WEAPON5': '0.050', 'AMMO3': '0.086', 'AMMO4': '0.087', 'weapon5': '0.192', 'WEAPON4': '0.200', 'HITCOUNT': '0.200', 'weapon4': '0.312', 'WEAPON3': '0.450', 'DAMAGECOUNT': '1.104', 'weapon3': '1.214', 'weapon2': '1.464', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:54:35,689][63805] DAMAGECOUNT value on done: 9896.0 +[2023-09-14 14:54:35,689][63805] Sum rewards: -1.017, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-2.290', 'AMMO2': '0.003', 'AMMO5': '0.010', 'AMMO4': '0.013', 'WEAPON1': '0.020', 'ARMOR': '0.064', 'weapon5': '0.082', 'AMMO3': '0.098', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'HITCOUNT': '0.230', 'weapon4': '0.348', 'WEAPON3': '0.450', 'weapon3': '0.782', 'DAMAGECOUNT': '1.002', 'weapon2': '1.772', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:54:35,825][63733] Updated weights for policy 1, policy_version 1440 (0.0011) +[2023-09-14 14:54:36,073][63805] DAMAGECOUNT value on done: 6578.0 +[2023-09-14 14:54:36,074][63805] Sum rewards: -0.336, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.325', 'ARMOR': '0.012', 'AMMO5': '0.018', 'AMMO2': '0.020', 'weapon4': '0.040', 'WEAPON1': '0.050', 'weapon5': '0.056', 'AMMO3': '0.082', 'WEAPON4': '0.100', 'AMMO4': '0.102', 'HITCOUNT': '0.280', 'WEAPON5': '0.350', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.879', 'weapon3': '1.370', 'weapon2': '1.830', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:54:36,293][63806] DAMAGECOUNT value on done: 5994.0 +[2023-09-14 14:54:36,293][63806] Sum rewards: -2.221, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.840', 'AMMO2': '0.009', 'AMMO5': '0.013', 'AMMO4': '0.043', 'ARMOR': '0.056', 'AMMO3': '0.098', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'weapon5': '0.164', 'HITCOUNT': '0.190', 'weapon4': '0.202', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.900', 'weapon2': '1.030', 'weapon3': '1.864', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:54:36,662][63806] DAMAGECOUNT value on done: 8855.0 +[2023-09-14 14:54:36,662][63806] Sum rewards: -5.646, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.924', 'AMMO2': '0.008', 'ARMOR': '0.032', 'AMMO4': '0.037', 'WEAPON4': '0.100', 'AMMO3': '0.106', 'weapon4': '0.150', 'HITCOUNT': '0.160', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.681', 'FRAGCOUNT': '1.000', 'weapon3': '1.390', 'weapon2': '1.714'} +[2023-09-14 14:54:37,445][63769] DAMAGECOUNT value on done: 8731.0 +[2023-09-14 14:54:37,467][63576] Saving new best policy, reward=-2.810! +[2023-09-14 14:54:37,483][63771] DAMAGECOUNT value on done: 5268.0 +[2023-09-14 14:54:37,483][63771] Sum rewards: -3.224, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.460', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'AMMO5': '0.020', 'AMMO4': '0.021', 'weapon4': '0.024', 'ARMOR': '0.036', 'WEAPON4': '0.050', 'weapon7': '0.054', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.131', 'HITCOUNT': '0.150', 'weapon5': '0.158', 'WEAPON7': '0.200', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.630', 'WEAPON3': '0.850', 'weapon2': '1.300', 'weapon3': '1.758', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:54:37,775][63769] DAMAGECOUNT value on done: 6411.0 +[2023-09-14 14:54:37,775][63769] Sum rewards: -4.015, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.666', 'AMMO5': '0.005', 'AMMO2': '0.013', 'weapon5': '0.020', 'AMMO4': '0.064', 'ARMOR': '0.076', 'WEAPON5': '0.100', 'AMMO3': '0.149', 'HITCOUNT': '0.160', 'WEAPON4': '0.350', 'weapon4': '0.482', 'DAMAGECOUNT': '0.660', 'WEAPON3': '1.000', 'weapon2': '1.230', 'weapon3': '1.842', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:54:37,820][63771] DAMAGECOUNT value on done: 7545.0 +[2023-09-14 14:54:37,821][63771] Sum rewards: -6.640, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.492', 'AMMO4': '-0.037', 'AMMO2': '-0.007', 'AMMO5': '0.017', 'ARMOR': '0.036', 'weapon5': '0.066', 'HITCOUNT': '0.170', 'AMMO3': '0.171', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.567', 'WEAPON3': '1.100', 'weapon2': '1.486', 'weapon3': '1.832', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:54:38,739][63732] Updated weights for policy 0, policy_version 1510 (0.0011) +[2023-09-14 14:54:40,432][63770] DAMAGECOUNT value on done: 8895.0 +[2023-09-14 14:54:40,821][63770] DAMAGECOUNT value on done: 6108.0 +[2023-09-14 14:54:41,529][63767] DAMAGECOUNT value on done: 9585.0 +[2023-09-14 14:54:41,530][63767] Sum rewards: -4.914, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-2.130', 'AMMO4': '-0.004', 'AMMO2': '-0.001', 'AMMO5': '0.020', 'WEAPON1': '0.030', 'ARMOR': '0.048', 'weapon5': '0.070', 'AMMO3': '0.221', 'HITCOUNT': '0.290', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.930', 'weapon2': '1.196', 'WEAPON3': '1.300', 'weapon3': '2.266', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:54:41,855][63767] DAMAGECOUNT value on done: 9731.0 +[2023-09-14 14:54:41,855][63767] Sum rewards: -5.349, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.030', 'AMMO5': '0.005', 'AMMO2': '0.013', 'weapon5': '0.026', 'WEAPON5': '0.050', 'ARMOR': '0.064', 'AMMO4': '0.064', 'AMMO3': '0.154', 'WEAPON4': '0.200', 'weapon4': '0.330', 'HITCOUNT': '0.350', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.900', 'weapon2': '1.008', 'DAMAGECOUNT': '1.275', 'weapon3': '1.992'} +[2023-09-14 14:54:43,307][63733] Updated weights for policy 1, policy_version 1450 (0.0011) +[2023-09-14 14:54:44,191][63805] DAMAGECOUNT value on done: 9050.0 +[2023-09-14 14:54:44,191][63805] Sum rewards: -3.047, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.510', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'WEAPON5': '0.100', 'AMMO3': '0.131', 'HITCOUNT': '0.250', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.870', 'FRAGCOUNT': '1.000', 'weapon2': '1.446', 'weapon3': '1.922'} +[2023-09-14 14:54:44,547][63805] DAMAGECOUNT value on done: 9033.0 +[2023-09-14 14:54:44,547][63805] Sum rewards: -2.143, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.420', 'AMMO2': '0.004', 'AMMO5': '0.014', 'AMMO4': '0.022', 'ARMOR': '0.040', 'weapon4': '0.092', 'WEAPON4': '0.100', 'AMMO3': '0.140', 'weapon5': '0.152', 'WEAPON5': '0.300', 'HITCOUNT': '0.370', 'WEAPON3': '0.950', 'weapon2': '0.974', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.176', 'weapon3': '2.192'} +[2023-09-14 14:54:45,341][63732] Updated weights for policy 0, policy_version 1520 (0.0010) +[2023-09-14 14:54:46,131][63734] DAMAGECOUNT value on done: 7585.0 +[2023-09-14 14:54:46,132][63734] Sum rewards: -4.110, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.210', 'AMMO5': '0.005', 'weapon5': '0.016', 'AMMO2': '0.021', 'HITCOUNT': '0.080', 'AMMO3': '0.099', 'WEAPON5': '0.100', 'AMMO4': '0.103', 'WEAPON4': '0.250', 'weapon4': '0.266', 'DAMAGECOUNT': '0.435', 'ARMOR': '0.445', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.268', 'weapon2': '1.612'} +[2023-09-14 14:54:46,526][63734] DAMAGECOUNT value on done: 5984.0 +[2023-09-14 14:54:46,527][63734] Sum rewards: -5.726, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.040', 'AMMO2': '0.004', 'AMMO5': '0.005', 'AMMO4': '0.022', 'ARMOR': '0.052', 'HITCOUNT': '0.090', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.148', 'AMMO3': '0.149', 'DAMAGECOUNT': '0.240', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.400', 'weapon3': '1.804'} +[2023-09-14 14:54:47,383][63771] DAMAGECOUNT value on done: 8888.0 +[2023-09-14 14:54:47,383][63771] Sum rewards: -2.624, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.238', 'AMMO5': '0.005', 'AMMO2': '0.023', 'weapon5': '0.026', 'AMMO3': '0.089', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.114', 'ARMOR': '0.152', 'weapon4': '0.182', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.508', 'weapon2': '1.700'} +[2023-09-14 14:54:47,768][63771] DAMAGECOUNT value on done: 6275.0 +[2023-09-14 14:54:47,769][63771] Sum rewards: -0.195, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.069', 'AMMO4': '-0.008', 'AMMO2': '-0.001', 'AMMO5': '0.007', 'ARMOR': '0.008', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'AMMO3': '0.129', 'weapon4': '0.156', 'HITCOUNT': '0.270', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.894', 'weapon2': '1.250', 'weapon3': '1.718', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:54:48,364][63806] DAMAGECOUNT value on done: 8085.0 +[2023-09-14 14:54:48,721][63806] DAMAGECOUNT value on done: 7736.0 +[2023-09-14 14:54:48,721][63806] Sum rewards: 6.558, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.380', 'AMMO2': '0.000', 'AMMO4': '0.000', 'WEAPON1': '0.010', 'AMMO5': '0.013', 'AMMO3': '0.146', 'weapon7': '0.178', 'HITCOUNT': '0.240', 'weapon5': '0.270', 'AMMO6': '0.320', 'AMMO7': '0.320', 'WEAPON5': '0.350', 'WEAPON7': '0.400', 'ARMOR': '0.482', 'WEAPON3': '0.750', 'weapon2': '1.006', 'DAMAGECOUNT': '1.308', 'weapon3': '1.894', 'FRAGCOUNT': '7.000'} +[2023-09-14 14:54:50,760][63735] DAMAGECOUNT value on done: 7868.0 +[2023-09-14 14:54:50,760][63735] Sum rewards: -0.894, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.079', 'AMMO5': '0.003', 'AMMO2': '0.018', 'WEAPON5': '0.050', 'AMMO4': '0.089', 'weapon5': '0.124', 'HITCOUNT': '0.130', 'AMMO3': '0.147', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.447', 'ARMOR': '0.502', 'weapon4': '0.512', 'WEAPON3': '0.800', 'weapon2': '1.132', 'weapon3': '1.432', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:54:50,908][63733] Updated weights for policy 1, policy_version 1460 (0.0011) +[2023-09-14 14:54:51,088][63735] DAMAGECOUNT value on done: 7994.0 +[2023-09-14 14:54:51,089][63735] Sum rewards: -6.598, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.902', 'AMMO2': '0.011', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.053', 'WEAPON4': '0.100', 'weapon5': '0.112', 'AMMO3': '0.131', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'weapon4': '0.326', 'ARMOR': '0.432', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.154', 'weapon2': '1.752'} +[2023-09-14 14:54:51,112][63734] DAMAGECOUNT value on done: 8464.0 +[2023-09-14 14:54:51,112][63734] Sum rewards: 0.149, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.432', 'AMMO2': '0.000', 'AMMO4': '0.002', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'ARMOR': '0.072', 'AMMO3': '0.122', 'WEAPON4': '0.200', 'weapon5': '0.220', 'HITCOUNT': '0.250', 'WEAPON5': '0.300', 'weapon4': '0.452', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.825', 'weapon3': '1.192', 'weapon2': '1.470', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:54:51,513][63734] DAMAGECOUNT value on done: 7961.0 +[2023-09-14 14:54:51,514][63734] Sum rewards: 3.562, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.882', 'AMMO2': '0.006', 'weapon5': '0.006', 'AMMO5': '0.007', 'AMMO4': '0.027', 'ARMOR': '0.067', 'WEAPON4': '0.100', 'AMMO3': '0.139', 'WEAPON5': '0.150', 'weapon4': '0.160', 'HITCOUNT': '0.400', 'WEAPON3': '0.850', 'weapon2': '1.434', 'DAMAGECOUNT': '1.671', 'weapon3': '1.926', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:54:51,857][63770] DAMAGECOUNT value on done: 7041.0 +[2023-09-14 14:54:51,858][63770] Sum rewards: 0.112, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.606', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'AMMO5': '0.022', 'WEAPON4': '0.050', 'weapon4': '0.052', 'AMMO3': '0.122', 'weapon5': '0.152', 'HITCOUNT': '0.160', 'WEAPON5': '0.450', 'ARMOR': '0.513', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.726', 'weapon3': '1.332', 'weapon2': '1.952', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:54:52,143][63732] Updated weights for policy 0, policy_version 1530 (0.0011) +[2023-09-14 14:54:52,246][63770] DAMAGECOUNT value on done: 7415.0 +[2023-09-14 14:54:52,247][63770] Sum rewards: -5.070, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.344', 'AMMO5': '0.015', 'AMMO2': '0.023', 'ARMOR': '0.076', 'AMMO3': '0.113', 'AMMO4': '0.116', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon5': '0.206', 'HITCOUNT': '0.220', 'weapon4': '0.444', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.807', 'FRAGCOUNT': '1.000', 'weapon2': '1.310', 'weapon3': '1.444'} +[2023-09-14 14:54:53,872][63769] DAMAGECOUNT value on done: 8075.0 +[2023-09-14 14:54:53,873][63769] Sum rewards: -0.019, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.354', 'AMMO2': '0.014', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.067', 'weapon5': '0.126', 'AMMO3': '0.139', 'WEAPON4': '0.150', 'WEAPON5': '0.250', 'weapon4': '0.280', 'HITCOUNT': '0.350', 'ARMOR': '0.496', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.116', 'weapon3': '1.316', 'weapon2': '1.696', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:54:54,266][63769] DAMAGECOUNT value on done: 7719.0 +[2023-09-14 14:54:54,266][63769] Sum rewards: -1.679, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.970', 'AMMO5': '0.008', 'AMMO2': '0.021', 'ARMOR': '0.080', 'weapon5': '0.080', 'WEAPON4': '0.100', 'AMMO4': '0.104', 'AMMO3': '0.115', 'weapon4': '0.134', 'WEAPON5': '0.150', 'HITCOUNT': '0.240', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.978', 'weapon2': '1.632', 'weapon3': '1.650', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:54:56,079][63767] DAMAGECOUNT value on done: 9174.0 +[2023-09-14 14:54:56,080][63767] Sum rewards: -4.997, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.301', 'AMMO2': '0.008', 'WEAPON1': '0.010', 'AMMO5': '0.019', 'ARMOR': '0.036', 'AMMO4': '0.042', 'AMMO3': '0.075', 'weapon4': '0.094', 'WEAPON4': '0.100', 'HITCOUNT': '0.240', 'WEAPON5': '0.300', 'weapon5': '0.418', 'WEAPON3': '0.550', 'weapon2': '1.182', 'DAMAGECOUNT': '1.347', 'FRAGCOUNT': '1.500', 'weapon3': '1.632'} +[2023-09-14 14:54:56,451][63767] DAMAGECOUNT value on done: 7770.0 +[2023-09-14 14:54:56,452][63767] Sum rewards: -6.262, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.604', 'weapon5': '0.008', 'AMMO2': '0.012', 'ARMOR': '0.012', 'AMMO5': '0.012', 'AMMO4': '0.058', 'AMMO3': '0.137', 'HITCOUNT': '0.200', 'WEAPON5': '0.200', 'WEAPON4': '0.350', 'DAMAGECOUNT': '0.519', 'weapon4': '0.544', 'weapon2': '0.944', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon3': '1.896'} +[2023-09-14 14:54:57,624][63735] DAMAGECOUNT value on done: 8067.0 +[2023-09-14 14:54:57,925][63735] DAMAGECOUNT value on done: 5636.0 +[2023-09-14 14:54:57,926][63735] Sum rewards: -3.497, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.171', 'AMMO4': '-0.037', 'AMMO2': '-0.007', 'AMMO5': '0.005', 'weapon5': '0.016', 'ARMOR': '0.040', 'WEAPON1': '0.040', 'weapon4': '0.078', 'AMMO3': '0.094', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.140', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.465', 'FRAGCOUNT': '1.000', 'weapon3': '1.132', 'weapon2': '1.808'} +[2023-09-14 14:54:58,321][63733] Updated weights for policy 1, policy_version 1470 (0.0011) +[2023-09-14 14:54:58,429][63806] DAMAGECOUNT value on done: 6129.0 +[2023-09-14 14:54:58,430][63806] Sum rewards: -3.165, reward structure: {'DEATHCOUNT': '-9.000', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.015', 'WEAPON5': '0.050', 'AMMO4': '0.073', 'HEALTH': '0.080', 'AMMO3': '0.099', 'HITCOUNT': '0.110', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.630', 'weapon3': '1.710'} +[2023-09-14 14:54:58,510][63805] DAMAGECOUNT value on done: 10021.0 +[2023-09-14 14:54:58,761][63806] DAMAGECOUNT value on done: 8945.0 +[2023-09-14 14:54:58,809][63732] Updated weights for policy 0, policy_version 1540 (0.0011) +[2023-09-14 14:54:58,844][63805] DAMAGECOUNT value on done: 6992.0 +[2023-09-14 14:54:58,845][63805] Sum rewards: -1.759, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.829', 'AMMO5': '0.003', 'ARMOR': '0.004', 'weapon5': '0.008', 'AMMO2': '0.012', 'WEAPON5': '0.050', 'AMMO4': '0.057', 'AMMO3': '0.113', 'WEAPON4': '0.200', 'weapon4': '0.230', 'HITCOUNT': '0.280', 'WEAPON3': '0.800', 'weapon2': '0.962', 'DAMAGECOUNT': '1.242', 'weapon3': '2.110', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:55:00,229][63769] DAMAGECOUNT value on done: 8797.0 +[2023-09-14 14:55:00,553][63769] DAMAGECOUNT value on done: 6646.0 +[2023-09-14 14:55:00,554][63769] Sum rewards: 0.175, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.990', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'weapon5': '0.048', 'AMMO4': '0.054', 'weapon4': '0.064', 'AMMO3': '0.073', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'HITCOUNT': '0.160', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.705', 'weapon3': '1.614', 'weapon2': '1.618', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:55:00,773][63771] DAMAGECOUNT value on done: 5498.0 +[2023-09-14 14:55:00,774][63771] Sum rewards: -5.819, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.839', 'AMMO2': '0.006', 'WEAPON1': '0.020', 'AMMO5': '0.025', 'AMMO4': '0.030', 'weapon5': '0.050', 'WEAPON4': '0.100', 'AMMO3': '0.194', 'HITCOUNT': '0.220', 'weapon4': '0.220', 'WEAPON5': '0.350', 'ARMOR': '0.473', 'DAMAGECOUNT': '0.690', 'WEAPON3': '1.150', 'weapon2': '1.312', 'weapon3': '1.930', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:55:01,193][63771] DAMAGECOUNT value on done: 8093.0 +[2023-09-14 14:55:01,193][63771] Sum rewards: -3.640, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.716', 'AMMO2': '0.002', 'ARMOR': '0.004', 'AMMO4': '0.008', 'AMMO5': '0.019', 'AMMO3': '0.163', 'weapon5': '0.298', 'WEAPON5': '0.300', 'HITCOUNT': '0.340', 'FRAGCOUNT': '0.500', 'weapon2': '0.540', 'WEAPON3': '1.050', 'DAMAGECOUNT': '1.644', 'weapon3': '2.208'} +[2023-09-14 14:55:04,494][63767] DAMAGECOUNT value on done: 9675.0 +[2023-09-14 14:55:04,494][63767] Sum rewards: -3.996, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.542', 'AMMO5': '0.010', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'weapon5': '0.070', 'AMMO4': '0.090', 'HITCOUNT': '0.110', 'AMMO3': '0.124', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.270', 'weapon4': '0.276', 'ARMOR': '0.463', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.344', 'weapon3': '1.450'} +[2023-09-14 14:55:04,850][63767] DAMAGECOUNT value on done: 10195.0 +[2023-09-14 14:55:04,851][63767] Sum rewards: -1.098, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.492', 'AMMO2': '0.004', 'AMMO5': '0.005', 'AMMO4': '0.019', 'weapon5': '0.056', 'WEAPON5': '0.100', 'AMMO3': '0.140', 'WEAPON4': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon4': '0.378', 'HITCOUNT': '0.400', 'ARMOR': '0.472', 'WEAPON3': '0.700', 'weapon3': '1.320', 'DAMAGECOUNT': '1.392', 'weapon2': '1.608', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:55:05,495][63770] DAMAGECOUNT value on done: 9030.0 +[2023-09-14 14:55:05,496][63770] Sum rewards: -3.068, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.771', 'AMMO4': '-0.047', 'AMMO2': '-0.009', 'AMMO5': '0.005', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.122', 'AMMO3': '0.141', 'HITCOUNT': '0.150', 'weapon7': '0.152', 'weapon4': '0.266', 'AMMO6': '0.320', 'AMMO7': '0.320', 'WEAPON7': '0.400', 'DAMAGECOUNT': '0.405', 'ARMOR': '0.460', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.800', 'weapon3': '1.352', 'weapon2': '1.416'} +[2023-09-14 14:55:05,580][63732] Updated weights for policy 0, policy_version 1550 (0.0010) +[2023-09-14 14:55:05,916][63733] Updated weights for policy 1, policy_version 1480 (0.0011) +[2023-09-14 14:55:05,934][63770] DAMAGECOUNT value on done: 6728.0 +[2023-09-14 14:55:05,934][63770] Sum rewards: -1.362, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.169', 'AMMO4': '-0.018', 'AMMO2': '-0.004', 'ARMOR': '0.004', 'AMMO5': '0.007', 'weapon5': '0.020', 'AMMO3': '0.101', 'WEAPON5': '0.150', 'HITCOUNT': '0.470', 'WEAPON3': '0.600', 'weapon3': '1.388', 'weapon2': '1.728', 'DAMAGECOUNT': '1.860', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:55:07,501][63805] DAMAGECOUNT value on done: 9268.0 +[2023-09-14 14:55:07,502][63805] Sum rewards: -1.182, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.584', 'AMMO2': '0.003', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO4': '0.016', 'ARMOR': '0.052', 'weapon5': '0.062', 'WEAPON5': '0.100', 'AMMO3': '0.155', 'HITCOUNT': '0.260', 'DAMAGECOUNT': '0.654', 'WEAPON3': '0.750', 'weapon2': '1.150', 'weapon3': '2.184', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:55:07,824][63805] DAMAGECOUNT value on done: 9389.0 +[2023-09-14 14:55:07,824][63805] Sum rewards: -2.168, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.354', 'AMMO5': '0.013', 'AMMO2': '0.029', 'weapon5': '0.068', 'ARMOR': '0.072', 'WEAPON5': '0.100', 'weapon4': '0.118', 'AMMO3': '0.133', 'AMMO4': '0.147', 'WEAPON4': '0.150', 'HITCOUNT': '0.270', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.068', 'weapon3': '1.366', 'weapon2': '1.652', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:55:10,453][63771] DAMAGECOUNT value on done: 9185.0 +[2023-09-14 14:55:10,453][63771] Sum rewards: -4.360, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.942', 'AMMO2': '0.008', 'AMMO5': '0.010', 'weapon5': '0.016', 'AMMO4': '0.040', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.102', 'weapon4': '0.120', 'HITCOUNT': '0.280', 'ARMOR': '0.507', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.891', 'weapon2': '1.472', 'weapon3': '1.586', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:55:10,782][63771] DAMAGECOUNT value on done: 6576.0 +[2023-09-14 14:55:10,805][63806] DAMAGECOUNT value on done: 8554.0 +[2023-09-14 14:55:10,805][63806] Sum rewards: 0.082, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.828', 'AMMO5': '0.006', 'AMMO2': '0.014', 'ARMOR': '0.040', 'AMMO4': '0.069', 'AMMO3': '0.131', 'WEAPON5': '0.150', 'HITCOUNT': '0.200', 'weapon5': '0.212', 'weapon4': '0.218', 'WEAPON4': '0.250', 'WEAPON3': '0.750', 'weapon2': '1.406', 'DAMAGECOUNT': '1.407', 'weapon3': '1.556', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:55:11,113][63734] DAMAGECOUNT value on done: 7734.0 +[2023-09-14 14:55:11,113][63734] Sum rewards: -1.256, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.316', 'AMMO2': '0.009', 'ARMOR': '0.016', 'AMMO5': '0.020', 'AMMO4': '0.045', 'WEAPON4': '0.050', 'AMMO3': '0.105', 'HITCOUNT': '0.160', 'weapon5': '0.202', 'weapon4': '0.254', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.447', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.158', 'weapon3': '1.444'} +[2023-09-14 14:55:11,179][63806] DAMAGECOUNT value on done: 8047.0 +[2023-09-14 14:55:11,180][63806] Sum rewards: -1.178, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.650', 'AMMO2': '0.002', 'AMMO4': '0.007', 'AMMO5': '0.010', 'ARMOR': '0.056', 'WEAPON4': '0.100', 'AMMO3': '0.138', 'weapon5': '0.240', 'HITCOUNT': '0.280', 'WEAPON5': '0.300', 'weapon4': '0.386', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.933', 'weapon2': '1.220', 'weapon3': '1.500', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:55:11,499][63734] DAMAGECOUNT value on done: 6109.0 +[2023-09-14 14:55:11,499][63734] Sum rewards: -4.072, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.381', 'AMMO5': '0.013', 'weapon5': '0.014', 'AMMO2': '0.021', 'WEAPON1': '0.040', 'ARMOR': '0.048', 'AMMO3': '0.072', 'AMMO4': '0.104', 'HITCOUNT': '0.110', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.400', 'weapon4': '0.502', 'weapon3': '0.870', 'FRAGCOUNT': '1.000', 'weapon2': '1.490'} +[2023-09-14 14:55:12,289][63732] Updated weights for policy 0, policy_version 1560 (0.0011) +[2023-09-14 14:55:13,428][63733] Updated weights for policy 1, policy_version 1490 (0.0011) +[2023-09-14 14:55:13,535][63735] DAMAGECOUNT value on done: 8116.0 +[2023-09-14 14:55:13,536][63735] Sum rewards: -2.784, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.440', 'AMMO2': '0.008', 'weapon5': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.039', 'ARMOR': '0.040', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon7': '0.134', 'HITCOUNT': '0.140', 'AMMO3': '0.145', 'WEAPON7': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.228', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.744', 'WEAPON3': '0.800', 'weapon2': '1.362', 'weapon3': '1.604', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:55:13,938][63735] DAMAGECOUNT value on done: 8461.0 +[2023-09-14 14:55:13,939][63735] Sum rewards: 1.164, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.519', 'AMMO2': '0.001', 'AMMO4': '0.004', 'weapon5': '0.012', 'AMMO5': '0.013', 'ARMOR': '0.020', 'WEAPON4': '0.100', 'AMMO3': '0.122', 'weapon4': '0.208', 'WEAPON5': '0.250', 'HITCOUNT': '0.380', 'WEAPON3': '0.850', 'weapon2': '1.048', 'DAMAGECOUNT': '1.401', 'weapon3': '2.024', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:55:14,353][63734] DAMAGECOUNT value on done: 8594.0 +[2023-09-14 14:55:14,353][63734] Sum rewards: -2.315, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.430', 'AMMO2': '0.003', 'AMMO5': '0.014', 'AMMO4': '0.015', 'ARMOR': '0.072', 'weapon5': '0.098', 'AMMO3': '0.115', 'HITCOUNT': '0.120', 'WEAPON4': '0.150', 'weapon4': '0.290', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.034', 'weapon2': '1.714'} +[2023-09-14 14:55:14,700][63734] DAMAGECOUNT value on done: 8209.0 +[2023-09-14 14:55:14,701][63734] Sum rewards: -8.335, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-1.296', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'AMMO2': '0.022', 'weapon5': '0.032', 'weapon4': '0.082', 'AMMO4': '0.111', 'WEAPON4': '0.150', 'AMMO3': '0.171', 'WEAPON5': '0.250', 'HITCOUNT': '0.260', 'DAMAGECOUNT': '0.744', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon3': '1.692', 'weapon2': '1.772'} +[2023-09-14 14:55:17,098][63770] DAMAGECOUNT value on done: 7130.0 +[2023-09-14 14:55:17,295][63769] DAMAGECOUNT value on done: 8729.0 +[2023-09-14 14:55:17,295][63769] Sum rewards: 2.295, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.646', 'AMMO4': '-0.017', 'AMMO2': '-0.003', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'ARMOR': '0.020', 'AMMO3': '0.135', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.250', 'weapon5': '0.268', 'HITCOUNT': '0.340', 'WEAPON3': '0.900', 'weapon2': '1.094', 'DAMAGECOUNT': '1.962', 'weapon3': '2.120', 'FRAGCOUNT': '6.000'} +[2023-09-14 14:55:17,517][63770] DAMAGECOUNT value on done: 7710.0 +[2023-09-14 14:55:17,517][63770] Sum rewards: -0.583, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO2': '0.009', 'WEAPON1': '0.010', 'ARMOR': '0.040', 'AMMO4': '0.044', 'AMMO3': '0.119', 'WEAPON4': '0.150', 'weapon4': '0.164', 'HITCOUNT': '0.200', 'HEALTH': '0.254', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.885', 'weapon2': '1.528', 'weapon3': '1.664', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:55:17,705][63769] DAMAGECOUNT value on done: 7894.0 +[2023-09-14 14:55:17,708][63769] Sum rewards: -7.442, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.648', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'AMMO4': '0.022', 'AMMO5': '0.028', 'weapon4': '0.076', 'WEAPON4': '0.100', 'weapon5': '0.108', 'HITCOUNT': '0.160', 'AMMO3': '0.212', 'WEAPON5': '0.450', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.525', 'WEAPON3': '0.900', 'weapon3': '1.484', 'weapon2': '1.626'} +[2023-09-14 14:55:18,831][63767] DAMAGECOUNT value on done: 9249.0 +[2023-09-14 14:55:18,831][63767] Sum rewards: -0.263, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.018', 'weapon5': '0.024', 'HITCOUNT': '0.050', 'AMMO3': '0.076', 'ARMOR': '0.084', 'AMMO4': '0.090', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.225', 'weapon4': '0.232', 'WEAPON3': '0.450', 'HEALTH': '0.458', 'FRAGCOUNT': '1.000', 'weapon2': '1.184', 'weapon3': '1.578'} +[2023-09-14 14:55:19,138][63732] Updated weights for policy 0, policy_version 1570 (0.0011) +[2023-09-14 14:55:19,184][63767] DAMAGECOUNT value on done: 8275.0 +[2023-09-14 14:55:19,185][63767] Sum rewards: 2.312, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.992', 'AMMO5': '0.005', 'AMMO2': '0.008', 'AMMO4': '0.040', 'weapon5': '0.042', 'AMMO3': '0.080', 'ARMOR': '0.088', 'WEAPON5': '0.100', 'WEAPON4': '0.300', 'weapon4': '0.340', 'HITCOUNT': '0.390', 'WEAPON3': '0.500', 'weapon2': '1.468', 'DAMAGECOUNT': '1.515', 'weapon3': '1.678', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:55:20,362][63735] DAMAGECOUNT value on done: 8279.0 +[2023-09-14 14:55:20,363][63735] Sum rewards: 0.040, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.717', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO2': '0.027', 'AMMO3': '0.081', 'weapon5': '0.128', 'AMMO4': '0.135', 'WEAPON5': '0.150', 'HITCOUNT': '0.190', 'WEAPON4': '0.250', 'weapon4': '0.340', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.636', 'weapon2': '1.232', 'weapon3': '1.460', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:55:20,687][63735] DAMAGECOUNT value on done: 5756.0 +[2023-09-14 14:55:20,996][63806] DAMAGECOUNT value on done: 6508.0 +[2023-09-14 14:55:20,997][63806] Sum rewards: -6.038, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.972', 'AMMO2': '0.008', 'ARMOR': '0.008', 'AMMO4': '0.039', 'WEAPON4': '0.050', 'weapon4': '0.136', 'AMMO3': '0.188', 'HITCOUNT': '0.300', 'weapon2': '0.954', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.137', 'WEAPON3': '1.150', 'weapon3': '2.214'} +[2023-09-14 14:55:21,180][63733] Updated weights for policy 1, policy_version 1500 (0.0010) +[2023-09-14 14:55:21,398][63806] DAMAGECOUNT value on done: 9095.0 +[2023-09-14 14:55:21,399][63806] Sum rewards: -5.251, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.021', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.008', 'AMMO2': '-0.001', 'AMMO5': '0.004', 'WEAPON1': '0.020', 'weapon5': '0.028', 'AMMO3': '0.085', 'WEAPON5': '0.100', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.550', 'weapon3': '1.408', 'weapon2': '1.714'} +[2023-09-14 14:55:21,429][63805] DAMAGECOUNT value on done: 10248.0 +[2023-09-14 14:55:21,429][63805] Sum rewards: -3.757, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.871', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.018', 'weapon4': '0.048', 'ARMOR': '0.060', 'AMMO4': '0.090', 'WEAPON4': '0.100', 'AMMO3': '0.154', 'weapon5': '0.156', 'WEAPON5': '0.200', 'HITCOUNT': '0.230', 'DAMAGECOUNT': '0.681', 'WEAPON3': '0.850', 'weapon2': '1.260', 'weapon3': '1.996', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:55:21,775][63805] DAMAGECOUNT value on done: 7174.0 +[2023-09-14 14:55:21,776][63805] Sum rewards: -4.792, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.280', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'ARMOR': '0.072', 'AMMO3': '0.122', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.546', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.780', 'weapon3': '1.806'} +[2023-09-14 14:55:23,471][63769] DAMAGECOUNT value on done: 9012.0 +[2023-09-14 14:55:23,797][63769] DAMAGECOUNT value on done: 6934.0 +[2023-09-14 14:55:23,797][63769] Sum rewards: -5.256, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.350', 'AMMO5': '0.003', 'AMMO2': '0.006', 'AMMO4': '0.031', 'AMMO3': '0.146', 'HITCOUNT': '0.230', 'DAMAGECOUNT': '0.864', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.328', 'weapon3': '2.036'} +[2023-09-14 14:55:24,221][63771] DAMAGECOUNT value on done: 5824.0 +[2023-09-14 14:55:24,222][63771] Sum rewards: 0.522, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.855', 'AMMO5': '0.003', 'AMMO2': '0.009', 'weapon5': '0.010', 'ARMOR': '0.040', 'AMMO4': '0.047', 'WEAPON5': '0.050', 'AMMO3': '0.120', 'HITCOUNT': '0.300', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.978', 'weapon3': '1.654', 'weapon2': '1.666', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:55:24,661][63771] DAMAGECOUNT value on done: 8309.0 +[2023-09-14 14:55:24,662][63771] Sum rewards: -0.917, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.976', 'weapon5': '0.002', 'AMMO5': '0.010', 'AMMO2': '0.030', 'ARMOR': '0.052', 'AMMO3': '0.147', 'AMMO4': '0.148', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'WEAPON4': '0.350', 'weapon4': '0.546', 'DAMAGECOUNT': '0.648', 'WEAPON3': '0.750', 'weapon2': '0.760', 'weapon3': '1.796', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:55:25,957][63732] Updated weights for policy 0, policy_version 1580 (0.0011) +[2023-09-14 14:55:27,947][63767] DAMAGECOUNT value on done: 9785.0 +[2023-09-14 14:55:27,948][63767] Sum rewards: -1.616, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.078', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO4': '0.051', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.113', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.330', 'weapon4': '0.344', 'ARMOR': '0.567', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.320', 'weapon3': '1.462'} +[2023-09-14 14:55:28,311][63767] DAMAGECOUNT value on done: 11140.0 +[2023-09-14 14:55:28,312][63767] Sum rewards: 5.121, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.926', 'AMMO2': '0.017', 'AMMO5': '0.027', 'weapon7': '0.038', 'ARMOR': '0.056', 'AMMO4': '0.083', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.116', 'WEAPON4': '0.250', 'weapon5': '0.260', 'HITCOUNT': '0.300', 'WEAPON5': '0.350', 'weapon4': '0.462', 'WEAPON3': '0.650', 'weapon2': '1.060', 'weapon3': '1.492', 'DAMAGECOUNT': '2.835', 'FRAGCOUNT': '4.500'} +[2023-09-14 14:55:28,768][63733] Updated weights for policy 1, policy_version 1510 (0.0011) +[2023-09-14 14:55:30,779][63805] DAMAGECOUNT value on done: 9490.0 +[2023-09-14 14:55:30,779][63805] Sum rewards: -5.836, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.314', 'AMMO5': '0.010', 'AMMO2': '0.016', 'AMMO4': '0.080', 'WEAPON4': '0.100', 'ARMOR': '0.112', 'weapon5': '0.122', 'AMMO3': '0.139', 'HITCOUNT': '0.190', 'WEAPON5': '0.250', 'weapon4': '0.278', 'DAMAGECOUNT': '0.666', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.362', 'weapon3': '1.602'} +[2023-09-14 14:55:30,969][63770] DAMAGECOUNT value on done: 9523.0 +[2023-09-14 14:55:30,969][63770] Sum rewards: 3.513, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.426', 'AMMO5': '0.010', 'AMMO2': '0.018', 'AMMO3': '0.070', 'AMMO4': '0.091', 'ARMOR': '0.116', 'WEAPON4': '0.150', 'weapon5': '0.196', 'weapon4': '0.214', 'WEAPON5': '0.250', 'HITCOUNT': '0.390', 'WEAPON3': '0.450', 'weapon2': '0.858', 'DAMAGECOUNT': '1.479', 'weapon3': '1.646', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:55:31,107][63805] DAMAGECOUNT value on done: 9837.0 +[2023-09-14 14:55:31,108][63805] Sum rewards: 0.947, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.267', 'weapon4': '0.010', 'AMMO2': '0.011', 'AMMO5': '0.018', 'ARMOR': '0.028', 'AMMO4': '0.055', 'WEAPON4': '0.100', 'weapon5': '0.132', 'AMMO3': '0.186', 'WEAPON5': '0.300', 'HITCOUNT': '0.400', 'WEAPON3': '0.900', 'weapon2': '1.202', 'DAMAGECOUNT': '1.344', 'weapon3': '2.278', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:55:31,421][63770] DAMAGECOUNT value on done: 6833.0 +[2023-09-14 14:55:31,422][63770] Sum rewards: -2.918, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.399', 'AMMO2': '0.003', 'AMMO4': '0.012', 'AMMO5': '0.015', 'ARMOR': '0.016', 'WEAPON1': '0.020', 'weapon5': '0.030', 'HITCOUNT': '0.100', 'AMMO3': '0.107', 'WEAPON4': '0.150', 'weapon4': '0.282', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.352', 'weapon3': '1.580'} +[2023-09-14 14:55:32,646][63732] Updated weights for policy 0, policy_version 1590 (0.0011) +[2023-09-14 14:55:33,637][63771] DAMAGECOUNT value on done: 9585.0 +[2023-09-14 14:55:33,637][63771] Sum rewards: -1.684, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.060', 'AMMO4': '-0.045', 'AMMO2': '-0.009', 'ARMOR': '0.044', 'AMMO3': '0.082', 'WEAPON4': '0.200', 'weapon4': '0.240', 'HITCOUNT': '0.260', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.200', 'weapon3': '1.358', 'weapon2': '1.946', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:55:33,838][63806] DAMAGECOUNT value on done: 8998.0 +[2023-09-14 14:55:33,839][63806] Sum rewards: 1.916, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.536', 'AMMO4': '-0.022', 'AMMO2': '-0.004', 'WEAPON1': '0.010', 'AMMO5': '0.022', 'AMMO3': '0.138', 'weapon5': '0.152', 'weapon7': '0.188', 'HITCOUNT': '0.300', 'WEAPON5': '0.400', 'AMMO6': '0.420', 'AMMO7': '0.420', 'ARMOR': '0.487', 'WEAPON7': '0.500', 'WEAPON3': '0.850', 'weapon2': '1.186', 'DAMAGECOUNT': '1.332', 'weapon3': '1.822', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:55:34,034][63771] DAMAGECOUNT value on done: 6663.0 +[2023-09-14 14:55:34,221][63806] DAMAGECOUNT value on done: 8087.0 +[2023-09-14 14:55:34,221][63806] Sum rewards: -7.248, reward structure: {'DEATHCOUNT': '-10.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.148', 'AMMO2': '0.016', 'AMMO5': '0.023', 'ARMOR': '0.023', 'WEAPON1': '0.030', 'HITCOUNT': '0.050', 'AMMO4': '0.081', 'WEAPON4': '0.100', 'DAMAGECOUNT': '0.120', 'AMMO3': '0.127', 'weapon4': '0.204', 'weapon5': '0.280', 'WEAPON5': '0.400', 'WEAPON3': '0.550', 'weapon2': '1.428', 'weapon3': '1.468'} +[2023-09-14 14:55:36,344][63733] Updated weights for policy 1, policy_version 1520 (0.0011) +[2023-09-14 14:55:36,420][63734] DAMAGECOUNT value on done: 8091.0 +[2023-09-14 14:55:36,421][63734] Sum rewards: 1.501, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO5': '0.007', 'ARMOR': '0.008', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'weapon4': '0.026', 'AMMO4': '0.082', 'AMMO3': '0.113', 'weapon5': '0.116', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon7': '0.122', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.250', 'HEALTH': '0.362', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.071', 'weapon2': '1.086', 'weapon3': '1.990', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:55:36,439][63735] DAMAGECOUNT value on done: 8354.0 +[2023-09-14 14:55:36,439][63735] Sum rewards: -4.055, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.393', 'AMMO5': '0.010', 'AMMO2': '0.012', 'AMMO4': '0.062', 'ARMOR': '0.068', 'weapon5': '0.090', 'WEAPON5': '0.100', 'AMMO3': '0.148', 'WEAPON4': '0.250', 'HITCOUNT': '0.250', 'weapon4': '0.298', 'DAMAGECOUNT': '0.714', 'WEAPON3': '0.850', 'weapon2': '1.262', 'weapon3': '1.724', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:55:36,809][63734] DAMAGECOUNT value on done: 6279.0 +[2023-09-14 14:55:36,814][63735] DAMAGECOUNT value on done: 9011.0 +[2023-09-14 14:55:36,814][63735] Sum rewards: -1.071, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.923', 'weapon7': '0.006', 'AMMO5': '0.007', 'AMMO2': '0.009', 'WEAPON1': '0.010', 'weapon5': '0.012', 'ARMOR': '0.040', 'AMMO4': '0.047', 'WEAPON4': '0.050', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.124', 'AMMO3': '0.164', 'HITCOUNT': '0.390', 'WEAPON3': '0.850', 'weapon2': '1.228', 'DAMAGECOUNT': '1.650', 'weapon3': '2.114', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:55:38,033][63734] DAMAGECOUNT value on done: 8833.0 +[2023-09-14 14:55:38,390][63734] DAMAGECOUNT value on done: 8459.0 +[2023-09-14 14:55:38,391][63734] Sum rewards: -5.022, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.530', 'AMMO4': '-0.043', 'AMMO2': '-0.009', 'AMMO5': '0.013', 'weapon5': '0.034', 'HITCOUNT': '0.150', 'AMMO3': '0.165', 'WEAPON5': '0.250', 'ARMOR': '0.456', 'DAMAGECOUNT': '0.750', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050', 'weapon2': '1.098', 'weapon3': '2.344'} +[2023-09-14 14:55:39,377][63732] Updated weights for policy 0, policy_version 1600 (0.0011) +[2023-09-14 14:55:40,579][63769] DAMAGECOUNT value on done: 8902.0 +[2023-09-14 14:55:40,580][63769] Sum rewards: -3.594, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.836', 'weapon7': '0.002', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'weapon5': '0.064', 'ARMOR': '0.076', 'AMMO4': '0.083', 'HITCOUNT': '0.120', 'AMMO3': '0.165', 'WEAPON5': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON4': '0.250', 'weapon4': '0.412', 'DAMAGECOUNT': '0.519', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.292', 'weapon3': '1.572'} +[2023-09-14 14:55:40,984][63769] DAMAGECOUNT value on done: 8279.0 +[2023-09-14 14:55:40,984][63769] Sum rewards: 2.262, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.530', 'weapon5': '0.002', 'AMMO5': '0.005', 'AMMO2': '0.014', 'ARMOR': '0.040', 'AMMO4': '0.067', 'WEAPON5': '0.100', 'AMMO3': '0.131', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.260', 'weapon4': '0.294', 'WEAPON4': '0.300', 'WEAPON3': '0.800', 'weapon2': '1.144', 'DAMAGECOUNT': '1.155', 'weapon3': '1.880', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:55:41,871][63767] DAMAGECOUNT value on done: 9518.0 +[2023-09-14 14:55:41,871][63767] Sum rewards: 0.061, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.670', 'AMMO2': '0.002', 'AMMO5': '0.005', 'AMMO4': '0.009', 'weapon4': '0.014', 'WEAPON1': '0.020', 'weapon5': '0.034', 'ARMOR': '0.036', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'AMMO3': '0.104', 'HITCOUNT': '0.220', 'DAMAGECOUNT': '0.807', 'WEAPON3': '0.850', 'weapon2': '1.314', 'weapon3': '1.916', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:55:42,286][63767] DAMAGECOUNT value on done: 8335.0 +[2023-09-14 14:55:42,287][63767] Sum rewards: -1.838, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.495', 'AMMO2': '0.001', 'AMMO4': '0.007', 'WEAPON1': '0.020', 'ARMOR': '0.020', 'WEAPON4': '0.050', 'HITCOUNT': '0.070', 'AMMO3': '0.105', 'DAMAGECOUNT': '0.180', 'weapon4': '0.180', 'WEAPON3': '0.700', 'weapon2': '0.978', 'weapon3': '1.346', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:55:42,465][63770] DAMAGECOUNT value on done: 7475.0 +[2023-09-14 14:55:42,465][63770] Sum rewards: -1.088, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.935', 'AMMO4': '-0.003', 'AMMO2': '-0.001', 'weapon5': '0.002', 'AMMO5': '0.003', 'WEAPON5': '0.050', 'AMMO3': '0.117', 'WEAPON4': '0.200', 'weapon4': '0.272', 'HITCOUNT': '0.290', 'ARMOR': '0.508', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.035', 'weapon2': '1.126', 'weapon3': '1.698', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:55:42,857][63770] DAMAGECOUNT value on done: 7900.0 +[2023-09-14 14:55:42,857][63770] Sum rewards: -4.657, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.712', 'AMMO2': '0.009', 'WEAPON1': '0.010', 'AMMO5': '0.013', 'weapon5': '0.014', 'ARMOR': '0.036', 'AMMO4': '0.044', 'WEAPON4': '0.100', 'HITCOUNT': '0.140', 'AMMO3': '0.160', 'weapon4': '0.180', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.570', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.114', 'weapon3': '1.966'} +[2023-09-14 14:55:42,867][63735] DAMAGECOUNT value on done: 8409.0 +[2023-09-14 14:55:42,868][63735] Sum rewards: -2.975, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.587', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.003', 'AMMO2': '0.003', 'weapon5': '0.006', 'AMMO4': '0.013', 'WEAPON1': '0.020', 'ARMOR': '0.044', 'WEAPON5': '0.050', 'AMMO3': '0.070', 'HITCOUNT': '0.080', 'weapon4': '0.086', 'WEAPON4': '0.100', 'WEAPON3': '0.350', 'DAMAGECOUNT': '0.390', 'weapon3': '1.304', 'weapon2': '1.594'} +[2023-09-14 14:55:43,246][63735] DAMAGECOUNT value on done: 5915.0 +[2023-09-14 14:55:43,247][63735] Sum rewards: -9.864, reward structure: {'DEATHCOUNT': '-15.000', 'HEALTH': '-1.596', 'AMMO2': '0.009', 'AMMO4': '0.044', 'ARMOR': '0.108', 'weapon4': '0.126', 'WEAPON4': '0.150', 'AMMO3': '0.176', 'HITCOUNT': '0.200', 'DAMAGECOUNT': '0.477', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.680', 'weapon3': '1.912'} +[2023-09-14 14:55:43,616][63770] Large shaping reward 2.606 for [('FRAGCOUNT', 2.0, 2.0), ('HITCOUNT', 0.05, 5), ('DAMAGECOUNT', 0.555, 185.0), ('AMMO3', -0.001, -2.0), ('weapon3', 0.002)] +[2023-09-14 14:55:43,678][63806] DAMAGECOUNT value on done: 6771.0 +[2023-09-14 14:55:43,678][63806] Sum rewards: -2.079, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.386', 'AMMO5': '0.005', 'AMMO2': '0.009', 'AMMO4': '0.045', 'weapon4': '0.048', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.136', 'weapon5': '0.140', 'HITCOUNT': '0.250', 'DAMAGECOUNT': '0.789', 'WEAPON3': '0.850', 'weapon2': '0.976', 'weapon3': '2.108', 'FRAGCOUNT': '2.500'} +[2023-09-14 14:55:44,022][63806] DAMAGECOUNT value on done: 9295.0 +[2023-09-14 14:55:44,023][63806] Sum rewards: -8.228, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.926', 'AMMO4': '-0.016', 'AMMO2': '-0.003', 'weapon5': '0.006', 'ARMOR': '0.016', 'AMMO5': '0.019', 'WEAPON1': '0.020', 'WEAPON4': '0.100', 'weapon4': '0.104', 'HITCOUNT': '0.150', 'AMMO3': '0.168', 'WEAPON5': '0.200', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.600', 'WEAPON3': '1.000', 'weapon3': '1.368', 'weapon2': '1.466'} +[2023-09-14 14:55:44,123][63733] Updated weights for policy 1, policy_version 1530 (0.0010) +[2023-09-14 14:55:44,255][63805] DAMAGECOUNT value on done: 10508.0 +[2023-09-14 14:55:44,255][63805] Sum rewards: -6.969, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-0.524', 'weapon5': '0.002', 'AMMO2': '0.004', 'AMMO5': '0.012', 'AMMO4': '0.017', 'ARMOR': '0.080', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'AMMO3': '0.168', 'DAMAGECOUNT': '0.780', 'WEAPON3': '1.000', 'weapon2': '1.394', 'FRAGCOUNT': '2.000', 'weapon3': '2.048'} +[2023-09-14 14:55:44,617][63805] DAMAGECOUNT value on done: 7174.0 +[2023-09-14 14:55:45,747][63732] Updated weights for policy 0, policy_version 1610 (0.0010) +[2023-09-14 14:55:46,442][63769] DAMAGECOUNT value on done: 9157.0 +[2023-09-14 14:55:46,442][63769] Sum rewards: -0.210, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.489', 'AMMO4': '-0.055', 'AMMO2': '-0.011', 'AMMO3': '0.083', 'HITCOUNT': '0.090', 'ARMOR': '0.432', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.450', 'FRAGCOUNT': '1.000', 'weapon2': '1.478', 'weapon3': '1.626'} +[2023-09-14 14:55:46,838][63769] DAMAGECOUNT value on done: 7169.0 +[2023-09-14 14:55:46,839][63769] Sum rewards: -5.983, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.626', 'AMMO4': '-0.033', 'AMMO2': '-0.007', 'WEAPON4': '0.100', 'AMMO3': '0.149', 'weapon4': '0.174', 'HITCOUNT': '0.180', 'ARMOR': '0.471', 'DAMAGECOUNT': '0.705', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon3': '1.254', 'weapon2': '2.000'} +[2023-09-14 14:55:47,896][63771] DAMAGECOUNT value on done: 6124.0 +[2023-09-14 14:55:47,897][63771] Sum rewards: -7.017, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-3.605', 'FRAGCOUNT': '0.000', 'AMMO2': '0.004', 'AMMO5': '0.013', 'AMMO4': '0.022', 'ARMOR': '0.056', 'weapon5': '0.100', 'AMMO3': '0.149', 'HITCOUNT': '0.180', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'weapon4': '0.270', 'DAMAGECOUNT': '0.900', 'WEAPON3': '1.050', 'weapon2': '1.296', 'weapon3': '1.848'} +[2023-09-14 14:55:48,294][63771] DAMAGECOUNT value on done: 8627.0 +[2023-09-14 14:55:48,294][63771] Sum rewards: -3.730, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.080', 'AMMO2': '0.007', 'AMMO5': '0.007', 'AMMO4': '0.035', 'weapon5': '0.078', 'AMMO3': '0.153', 'WEAPON5': '0.200', 'HITCOUNT': '0.250', 'WEAPON4': '0.250', 'weapon4': '0.480', 'ARMOR': '0.511', 'WEAPON3': '0.950', 'DAMAGECOUNT': '0.954', 'weapon2': '1.166', 'weapon3': '1.558', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:55:51,041][63767] DAMAGECOUNT value on done: 9871.0 +[2023-09-14 14:55:51,041][63767] Sum rewards: -2.278, reward structure: {'DEATHCOUNT': '-5.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.722', 'AMMO2': '0.008', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'ARMOR': '0.029', 'AMMO4': '0.040', 'HITCOUNT': '0.050', 'AMMO3': '0.062', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.150', 'weapon7': '0.152', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.258', 'WEAPON5': '0.300', 'weapon4': '0.326', 'weapon5': '0.366', 'WEAPON3': '0.400', 'weapon3': '1.044', 'weapon2': '1.532'} +[2023-09-14 14:55:51,441][63767] DAMAGECOUNT value on done: 11240.0 +[2023-09-14 14:55:51,441][63767] Sum rewards: 0.925, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.484', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'AMMO5': '0.017', 'weapon4': '0.034', 'AMMO4': '0.082', 'WEAPON4': '0.100', 'AMMO3': '0.103', 'HITCOUNT': '0.120', 'weapon5': '0.202', 'DAMAGECOUNT': '0.300', 'WEAPON5': '0.350', 'ARMOR': '0.412', 'WEAPON3': '0.550', 'weapon2': '1.210', 'weapon3': '1.652', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:55:51,859][63732] Updated weights for policy 0, policy_version 1620 (0.0011) +[2023-09-14 14:55:52,822][63733] Updated weights for policy 1, policy_version 1540 (0.0011) +[2023-09-14 14:55:53,862][63805] DAMAGECOUNT value on done: 9898.0 +[2023-09-14 14:55:53,862][63805] Sum rewards: -1.889, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.868', 'AMMO5': '0.012', 'AMMO2': '0.033', 'weapon7': '0.068', 'weapon5': '0.082', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.141', 'HITCOUNT': '0.150', 'AMMO4': '0.162', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.264', 'WEAPON3': '0.800', 'weapon2': '1.158', 'DAMAGECOUNT': '1.224', 'weapon3': '1.434', 'FRAGCOUNT': '2.500'} +[2023-09-14 14:55:54,261][63805] DAMAGECOUNT value on done: 9931.0 +[2023-09-14 14:55:54,262][63805] Sum rewards: -3.161, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.536', 'AMMO5': '0.017', 'AMMO2': '0.037', 'ARMOR': '0.044', 'HITCOUNT': '0.090', 'weapon5': '0.104', 'AMMO3': '0.135', 'AMMO4': '0.183', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.282', 'weapon4': '0.386', 'WEAPON4': '0.400', 'WEAPON3': '0.900', 'weapon2': '1.130', 'weapon3': '1.918', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:55:56,322][63770] DAMAGECOUNT value on done: 10010.0 +[2023-09-14 14:55:56,322][63770] Sum rewards: -0.143, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.868', 'AMMO2': '0.010', 'AMMO5': '0.011', 'WEAPON4': '0.050', 'AMMO4': '0.051', 'weapon5': '0.134', 'AMMO3': '0.173', 'WEAPON5': '0.250', 'ARMOR': '0.400', 'HITCOUNT': '0.400', 'WEAPON3': '1.000', 'weapon2': '1.276', 'DAMAGECOUNT': '1.461', 'weapon3': '2.258', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:55:56,712][63770] DAMAGECOUNT value on done: 7233.0 +[2023-09-14 14:55:56,712][63770] Sum rewards: -0.470, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.680', 'AMMO5': '0.003', 'AMMO2': '0.008', 'AMMO4': '0.039', 'WEAPON5': '0.050', 'weapon4': '0.082', 'WEAPON4': '0.150', 'AMMO3': '0.178', 'HITCOUNT': '0.220', 'ARMOR': '0.440', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.200', 'weapon3': '1.614', 'weapon2': '1.826', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:55:56,764][63806] DAMAGECOUNT value on done: 9163.0 +[2023-09-14 14:55:56,785][63771] DAMAGECOUNT value on done: 9885.0 +[2023-09-14 14:55:56,785][63771] Sum rewards: -4.456, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.530', 'AMMO4': '-0.030', 'AMMO2': '-0.006', 'AMMO5': '0.005', 'weapon5': '0.006', 'ARMOR': '0.024', 'WEAPON5': '0.100', 'AMMO3': '0.142', 'HITCOUNT': '0.230', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.900', 'weapon2': '1.302', 'FRAGCOUNT': '2.000', 'weapon3': '2.000'} +[2023-09-14 14:55:57,162][63806] DAMAGECOUNT value on done: 8321.0 +[2023-09-14 14:55:57,162][63806] Sum rewards: 1.196, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.089', 'AMMO2': '0.024', 'AMMO5': '0.030', 'WEAPON4': '0.100', 'AMMO3': '0.114', 'AMMO4': '0.118', 'HITCOUNT': '0.220', 'weapon5': '0.320', 'WEAPON5': '0.450', 'weapon4': '0.452', 'WEAPON3': '0.500', 'ARMOR': '0.557', 'DAMAGECOUNT': '0.702', 'weapon3': '1.348', 'weapon2': '1.350', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:55:57,173][63771] DAMAGECOUNT value on done: 7043.0 +[2023-09-14 14:55:57,173][63771] Sum rewards: -5.124, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.028', 'AMMO4': '-0.016', 'AMMO2': '-0.003', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'WEAPON4': '0.050', 'AMMO3': '0.177', 'HITCOUNT': '0.240', 'WEAPON3': '1.000', 'DAMAGECOUNT': '1.140', 'weapon3': '1.722', 'weapon2': '1.800', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:55:57,912][63732] Updated weights for policy 0, policy_version 1630 (0.0010) +[2023-09-14 14:55:59,508][63735] DAMAGECOUNT value on done: 8686.0 +[2023-09-14 14:55:59,508][63735] Sum rewards: -7.301, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.770', 'AMMO4': '-0.019', 'AMMO2': '-0.004', 'AMMO5': '0.025', 'weapon5': '0.052', 'AMMO3': '0.189', 'WEAPON5': '0.300', 'HITCOUNT': '0.320', 'DAMAGECOUNT': '0.996', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon3': '1.790', 'weapon2': '1.820'} +[2023-09-14 14:55:59,822][63735] DAMAGECOUNT value on done: 9591.0 +[2023-09-14 14:55:59,822][63735] Sum rewards: -2.823, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.159', 'AMMO4': '-0.003', 'AMMO2': '-0.000', 'AMMO5': '0.015', 'weapon5': '0.100', 'weapon4': '0.106', 'WEAPON4': '0.150', 'AMMO3': '0.180', 'WEAPON5': '0.300', 'HITCOUNT': '0.430', 'WEAPON3': '1.100', 'weapon2': '1.420', 'DAMAGECOUNT': '1.740', 'weapon3': '2.048', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:56:00,774][63733] Updated weights for policy 1, policy_version 1550 (0.0011) +[2023-09-14 14:56:01,809][63734] DAMAGECOUNT value on done: 9358.0 +[2023-09-14 14:56:01,810][63734] Sum rewards: 2.006, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.336', 'AMMO5': '0.019', 'AMMO2': '0.019', 'AMMO4': '0.096', 'ARMOR': '0.108', 'AMMO3': '0.143', 'WEAPON4': '0.150', 'weapon5': '0.150', 'HITCOUNT': '0.270', 'WEAPON5': '0.300', 'weapon4': '0.356', 'WEAPON3': '0.750', 'weapon2': '1.274', 'DAMAGECOUNT': '1.575', 'weapon3': '1.632', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:56:01,862][63734] DAMAGECOUNT value on done: 8306.0 +[2023-09-14 14:56:01,862][63734] Sum rewards: -3.814, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.698', 'AMMO2': '0.003', 'AMMO5': '0.007', 'AMMO4': '0.015', 'WEAPON4': '0.050', 'weapon4': '0.096', 'AMMO3': '0.115', 'WEAPON5': '0.150', 'weapon5': '0.182', 'HITCOUNT': '0.210', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.645', 'WEAPON3': '0.750', 'ARMOR': '0.900', 'weapon2': '1.346', 'weapon3': '1.914'} +[2023-09-14 14:56:02,218][63734] DAMAGECOUNT value on done: 8633.0 +[2023-09-14 14:56:02,218][63734] Sum rewards: -2.582, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.335', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'weapon5': '0.026', 'AMMO2': '0.033', 'ARMOR': '0.063', 'AMMO4': '0.163', 'HITCOUNT': '0.170', 'AMMO3': '0.173', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'weapon4': '0.322', 'DAMAGECOUNT': '0.522', 'weapon2': '0.840', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon3': '2.212'} +[2023-09-14 14:56:02,314][63734] DAMAGECOUNT value on done: 6403.0 +[2023-09-14 14:56:02,315][63734] Sum rewards: -4.927, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.896', 'AMMO2': '0.001', 'AMMO4': '0.007', 'WEAPON1': '0.020', 'weapon4': '0.034', 'ARMOR': '0.048', 'WEAPON4': '0.100', 'HITCOUNT': '0.120', 'AMMO3': '0.131', 'DAMAGECOUNT': '0.372', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.646', 'weapon2': '1.690'} +[2023-09-14 14:56:03,989][63769] DAMAGECOUNT value on done: 9087.0 +[2023-09-14 14:56:03,990][63769] Sum rewards: -3.758, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.851', 'AMMO2': '0.017', 'AMMO5': '0.028', 'WEAPON4': '0.050', 'weapon5': '0.056', 'AMMO4': '0.085', 'ARMOR': '0.144', 'AMMO3': '0.161', 'HITCOUNT': '0.180', 'weapon4': '0.180', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.555', 'WEAPON3': '1.050', 'weapon2': '1.092', 'FRAGCOUNT': '2.000', 'weapon3': '2.046'} +[2023-09-14 14:56:04,382][63769] DAMAGECOUNT value on done: 8523.0 +[2023-09-14 14:56:04,383][63769] Sum rewards: -1.934, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.552', 'AMMO5': '0.013', 'AMMO2': '0.015', 'weapon5': '0.072', 'AMMO4': '0.072', 'AMMO3': '0.133', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'HITCOUNT': '0.260', 'weapon4': '0.464', 'ARMOR': '0.476', 'DAMAGECOUNT': '0.732', 'weapon2': '0.786', 'WEAPON3': '0.850', 'weapon3': '1.646', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:56:04,814][63767] DAMAGECOUNT value on done: 9782.0 +[2023-09-14 14:56:04,814][63767] Sum rewards: -4.030, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.307', 'AMMO5': '0.003', 'AMMO2': '0.025', 'weapon5': '0.036', 'WEAPON5': '0.050', 'AMMO3': '0.114', 'AMMO4': '0.124', 'ARMOR': '0.144', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'weapon4': '0.414', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.792', 'WEAPON3': '0.800', 'weapon2': '1.162', 'weapon3': '1.694'} +[2023-09-14 14:56:04,890][63732] Updated weights for policy 0, policy_version 1640 (0.0012) +[2023-09-14 14:56:05,180][63735] DAMAGECOUNT value on done: 8638.0 +[2023-09-14 14:56:05,180][63735] Sum rewards: -2.481, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.418', 'AMMO2': '0.002', 'weapon5': '0.006', 'AMMO5': '0.010', 'AMMO4': '0.010', 'WEAPON4': '0.050', 'ARMOR': '0.072', 'WEAPON5': '0.100', 'weapon4': '0.100', 'AMMO3': '0.129', 'HITCOUNT': '0.200', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.687', 'FRAGCOUNT': '1.000', 'weapon3': '1.476', 'weapon2': '1.944'} +[2023-09-14 14:56:05,185][63767] DAMAGECOUNT value on done: 8723.0 +[2023-09-14 14:56:05,186][63767] Sum rewards: 0.636, reward structure: {'DEATHCOUNT': '-9.750', 'AMMO5': '0.012', 'weapon4': '0.016', 'AMMO2': '0.017', 'WEAPON4': '0.050', 'AMMO4': '0.085', 'HEALTH': '0.113', 'AMMO3': '0.128', 'weapon5': '0.188', 'WEAPON5': '0.200', 'HITCOUNT': '0.280', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.164', 'weapon3': '1.610', 'weapon2': '1.872', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:56:05,528][63735] DAMAGECOUNT value on done: 6250.0 +[2023-09-14 14:56:05,528][63735] Sum rewards: -3.283, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.854', 'AMMO2': '0.001', 'AMMO4': '0.004', 'AMMO5': '0.005', 'weapon5': '0.018', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.128', 'weapon4': '0.130', 'HITCOUNT': '0.290', 'ARMOR': '0.442', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.005', 'weapon2': '1.236', 'weapon3': '1.962', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:56:05,632][63806] DAMAGECOUNT value on done: 7081.0 +[2023-09-14 14:56:05,633][63806] Sum rewards: 0.525, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO5': '0.005', 'weapon5': '0.006', 'WEAPON1': '0.010', 'AMMO2': '0.023', 'WEAPON5': '0.050', 'weapon7': '0.074', 'AMMO3': '0.095', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO4': '0.115', 'WEAPON4': '0.150', 'HITCOUNT': '0.220', 'HEALTH': '0.368', 'weapon4': '0.394', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.930', 'weapon3': '1.174', 'weapon2': '1.360', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:56:06,021][63806] DAMAGECOUNT value on done: 9355.0 +[2023-09-14 14:56:06,713][63805] DAMAGECOUNT value on done: 10643.0 +[2023-09-14 14:56:06,714][63805] Sum rewards: -5.581, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.850', 'ARMOR': '0.004', 'AMMO2': '0.007', 'AMMO5': '0.007', 'AMMO4': '0.034', 'WEAPON5': '0.050', 'HITCOUNT': '0.080', 'weapon4': '0.114', 'AMMO3': '0.136', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.342', 'weapon3': '1.790'} +[2023-09-14 14:56:07,034][63805] DAMAGECOUNT value on done: 7266.0 +[2023-09-14 14:56:07,840][63733] Updated weights for policy 1, policy_version 1560 (0.0012) +[2023-09-14 14:56:07,942][63770] DAMAGECOUNT value on done: 7683.0 +[2023-09-14 14:56:07,942][63770] Sum rewards: 2.704, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-0.885', 'AMMO2': '0.004', 'AMMO5': '0.007', 'AMMO4': '0.018', 'WEAPON1': '0.020', 'weapon7': '0.054', 'ARMOR': '0.072', 'AMMO3': '0.084', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'HITCOUNT': '0.180', 'WEAPON5': '0.200', 'weapon5': '0.306', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.624', 'weapon3': '0.912', 'weapon2': '1.358', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:56:08,289][63770] DAMAGECOUNT value on done: 8010.0 +[2023-09-14 14:56:08,290][63770] Sum rewards: -2.474, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.294', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO4': '0.047', 'weapon5': '0.054', 'AMMO3': '0.062', 'HITCOUNT': '0.080', 'WEAPON5': '0.100', 'ARMOR': '0.108', 'WEAPON4': '0.200', 'weapon4': '0.240', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.450', 'weapon3': '0.826', 'weapon2': '1.808', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:56:09,413][63769] DAMAGECOUNT value on done: 9447.0 +[2023-09-14 14:56:09,414][63769] Sum rewards: 0.571, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.700', 'AMMO2': '0.001', 'AMMO5': '0.005', 'weapon5': '0.006', 'AMMO4': '0.006', 'ARMOR': '0.052', 'WEAPON5': '0.100', 'AMMO3': '0.120', 'HITCOUNT': '0.200', 'WEAPON4': '0.300', 'weapon4': '0.396', 'DAMAGECOUNT': '0.870', 'WEAPON3': '0.900', 'weapon2': '1.050', 'weapon3': '2.014', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:56:09,752][63769] DAMAGECOUNT value on done: 7214.0 +[2023-09-14 14:56:11,266][63771] DAMAGECOUNT value on done: 6563.0 +[2023-09-14 14:56:11,267][63771] Sum rewards: -1.060, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-0.638', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'ARMOR': '0.020', 'weapon7': '0.026', 'AMMO2': '0.036', 'AMMO3': '0.103', 'weapon5': '0.126', 'WEAPON5': '0.150', 'AMMO4': '0.180', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON4': '0.250', 'weapon4': '0.298', 'HITCOUNT': '0.300', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.317', 'weapon2': '1.584', 'weapon3': '1.660', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:56:11,594][63771] DAMAGECOUNT value on done: 9090.0 +[2023-09-14 14:56:11,594][63771] Sum rewards: 2.349, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.424', 'AMMO5': '0.003', 'AMMO2': '0.012', 'weapon5': '0.026', 'WEAPON5': '0.050', 'AMMO4': '0.061', 'AMMO3': '0.097', 'WEAPON4': '0.150', 'weapon4': '0.336', 'HITCOUNT': '0.430', 'WEAPON3': '0.500', 'ARMOR': '0.505', 'weapon2': '1.210', 'DAMAGECOUNT': '1.389', 'weapon3': '1.504', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:56:11,988][63732] Updated weights for policy 0, policy_version 1650 (0.0010) +[2023-09-14 14:56:13,520][63767] DAMAGECOUNT value on done: 10394.0 +[2023-09-14 14:56:13,520][63767] Sum rewards: -6.370, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.306', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.012', 'weapon5': '0.048', 'WEAPON4': '0.100', 'weapon4': '0.124', 'WEAPON5': '0.150', 'AMMO3': '0.176', 'HITCOUNT': '0.310', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.548', 'weapon3': '1.778', 'weapon2': '1.786'} +[2023-09-14 14:56:13,840][63767] DAMAGECOUNT value on done: 11870.0 +[2023-09-14 14:56:13,840][63767] Sum rewards: 0.744, reward structure: {'DEATHCOUNT': '-11.250', 'ARMOR': '0.008', 'AMMO5': '0.012', 'AMMO2': '0.042', 'AMMO3': '0.148', 'weapon4': '0.162', 'WEAPON5': '0.200', 'AMMO4': '0.211', 'WEAPON4': '0.350', 'weapon5': '0.360', 'HEALTH': '0.430', 'HITCOUNT': '0.430', 'WEAPON3': '0.750', 'weapon2': '0.866', 'DAMAGECOUNT': '1.890', 'weapon3': '2.134', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:56:14,526][63769] Large shaping reward -2.549 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.3, -100.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 14:56:14,875][63733] Updated weights for policy 1, policy_version 1570 (0.0010) +[2023-09-14 14:56:16,787][63805] DAMAGECOUNT value on done: 10098.0 +[2023-09-14 14:56:17,182][63805] DAMAGECOUNT value on done: 10311.0 +[2023-09-14 14:56:17,182][63805] Sum rewards: 0.792, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.152', 'AMMO5': '0.005', 'AMMO2': '0.024', 'weapon7': '0.044', 'ARMOR': '0.045', 'WEAPON5': '0.100', 'AMMO3': '0.103', 'AMMO4': '0.121', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon5': '0.234', 'HITCOUNT': '0.330', 'WEAPON4': '0.400', 'WEAPON3': '0.500', 'weapon4': '0.714', 'weapon3': '1.092', 'DAMAGECOUNT': '1.140', 'weapon2': '1.492', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:56:18,901][63806] DAMAGECOUNT value on done: 9313.0 +[2023-09-14 14:56:18,901][63806] Sum rewards: -5.330, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.706', 'AMMO5': '0.008', 'AMMO2': '0.012', 'AMMO4': '0.058', 'weapon5': '0.070', 'ARMOR': '0.090', 'WEAPON4': '0.100', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'AMMO3': '0.163', 'weapon4': '0.166', 'DAMAGECOUNT': '0.450', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.750', 'weapon3': '1.598', 'weapon2': '1.612'} +[2023-09-14 14:56:19,340][63806] DAMAGECOUNT value on done: 8578.0 +[2023-09-14 14:56:19,341][63806] Sum rewards: -2.428, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.494', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'AMMO2': '0.022', 'WEAPON4': '0.050', 'ARMOR': '0.052', 'WEAPON5': '0.100', 'AMMO4': '0.112', 'AMMO3': '0.128', 'HITCOUNT': '0.230', 'DAMAGECOUNT': '0.771', 'WEAPON3': '0.800', 'weapon2': '1.568', 'weapon3': '1.958', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:56:19,375][63732] Updated weights for policy 0, policy_version 1660 (0.0011) +[2023-09-14 14:56:20,132][63771] DAMAGECOUNT value on done: 9962.0 +[2023-09-14 14:56:20,133][63771] Sum rewards: -5.833, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.433', 'AMMO2': '0.007', 'AMMO4': '0.035', 'HITCOUNT': '0.080', 'AMMO3': '0.120', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.231', 'weapon4': '0.254', 'ARMOR': '0.488', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.460', 'weapon2': '1.574'} +[2023-09-14 14:56:20,472][63771] DAMAGECOUNT value on done: 7198.0 +[2023-09-14 14:56:20,473][63771] Sum rewards: -3.231, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.003', 'weapon4': '0.012', 'WEAPON1': '0.020', 'AMMO2': '0.020', 'HEALTH': '0.046', 'WEAPON5': '0.050', 'ARMOR': '0.060', 'AMMO4': '0.101', 'AMMO3': '0.104', 'weapon5': '0.124', 'HITCOUNT': '0.140', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.600', 'weapon2': '1.456', 'weapon3': '1.668'} +[2023-09-14 14:56:20,551][63771] Large shaping reward 2.642 for [('FRAGCOUNT', 2.0, 2.0), ('HITCOUNT', 0.04, 4.0), ('DAMAGECOUNT', 0.6, 200), ('weapon7', 0.002)] +[2023-09-14 14:56:22,210][63770] DAMAGECOUNT value on done: 10529.0 +[2023-09-14 14:56:22,210][63770] Sum rewards: 1.222, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.704', 'AMMO2': '0.008', 'AMMO5': '0.017', 'AMMO4': '0.039', 'weapon7': '0.046', 'weapon4': '0.060', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.153', 'HITCOUNT': '0.220', 'WEAPON5': '0.300', 'weapon5': '0.430', 'ARMOR': '0.496', 'WEAPON3': '0.750', 'weapon3': '1.172', 'weapon2': '1.528', 'DAMAGECOUNT': '1.557', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:56:22,470][63733] Updated weights for policy 1, policy_version 1580 (0.0010) +[2023-09-14 14:56:22,708][63770] DAMAGECOUNT value on done: 7407.0 +[2023-09-14 14:56:22,709][63770] Sum rewards: -1.564, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.738', 'AMMO5': '0.003', 'AMMO2': '0.020', 'WEAPON1': '0.030', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'AMMO4': '0.100', 'AMMO3': '0.107', 'HITCOUNT': '0.180', 'WEAPON4': '0.250', 'weapon4': '0.304', 'DAMAGECOUNT': '0.522', 'WEAPON3': '0.700', 'weapon2': '1.320', 'weapon3': '1.798', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:56:25,872][63735] DAMAGECOUNT value on done: 8826.0 +[2023-09-14 14:56:25,872][63735] Sum rewards: 1.067, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.506', 'AMMO5': '0.005', 'AMMO2': '0.009', 'ARMOR': '0.032', 'AMMO4': '0.042', 'weapon5': '0.076', 'AMMO3': '0.089', 'WEAPON5': '0.100', 'HITCOUNT': '0.130', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.550', 'weapon2': '1.226', 'weapon3': '1.394', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:56:26,240][63735] DAMAGECOUNT value on done: 10096.0 +[2023-09-14 14:56:26,240][63735] Sum rewards: 1.351, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.830', 'AMMO2': '0.015', 'AMMO5': '0.028', 'AMMO4': '0.073', 'WEAPON4': '0.100', 'AMMO3': '0.142', 'weapon5': '0.262', 'weapon4': '0.264', 'WEAPON5': '0.300', 'HITCOUNT': '0.400', 'WEAPON3': '0.900', 'weapon2': '1.326', 'DAMAGECOUNT': '1.515', 'weapon3': '1.856', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:56:26,416][63734] DAMAGECOUNT value on done: 9493.0 +[2023-09-14 14:56:26,417][63734] Sum rewards: -3.791, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.870', 'FRAGCOUNT': '-1.500', 'AMMO4': '-0.041', 'AMMO2': '-0.008', 'AMMO5': '0.018', 'ARMOR': '0.056', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.104', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.127', 'weapon5': '0.130', 'weapon7': '0.198', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.800', 'weapon3': '1.118', 'weapon2': '1.932'} +[2023-09-14 14:56:26,787][63734] DAMAGECOUNT value on done: 9063.0 +[2023-09-14 14:56:26,787][63734] Sum rewards: -0.942, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.514', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.012', 'AMMO4': '0.057', 'weapon4': '0.124', 'ARMOR': '0.141', 'weapon5': '0.144', 'WEAPON4': '0.150', 'AMMO3': '0.177', 'WEAPON5': '0.200', 'HITCOUNT': '0.290', 'WEAPON3': '1.050', 'weapon2': '1.282', 'DAMAGECOUNT': '1.290', 'weapon3': '2.138', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:56:27,467][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001586_6496256.pth... +[2023-09-14 14:56:27,467][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001669_6836224.pth... +[2023-09-14 14:56:27,523][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001274_5218304.pth +[2023-09-14 14:56:27,526][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001314_5382144.pth +[2023-09-14 14:56:27,891][63732] Updated weights for policy 0, policy_version 1670 (0.0011) +[2023-09-14 14:56:28,114][63734] DAMAGECOUNT value on done: 8757.0 +[2023-09-14 14:56:28,114][63734] Sum rewards: -0.023, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.475', 'AMMO2': '0.008', 'AMMO5': '0.015', 'AMMO4': '0.041', 'WEAPON4': '0.050', 'weapon5': '0.126', 'AMMO3': '0.147', 'weapon4': '0.194', 'WEAPON5': '0.250', 'HITCOUNT': '0.390', 'ARMOR': '0.416', 'WEAPON3': '0.900', 'weapon2': '0.966', 'DAMAGECOUNT': '1.353', 'weapon3': '2.346', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:56:28,308][63806] DAMAGECOUNT value on done: 7348.0 +[2023-09-14 14:56:28,483][63734] DAMAGECOUNT value on done: 6742.0 +[2023-09-14 14:56:28,484][63734] Sum rewards: -4.219, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.343', 'AMMO4': '-0.022', 'AMMO2': '-0.004', 'weapon5': '0.002', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'ARMOR': '0.044', 'weapon4': '0.058', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.170', 'HITCOUNT': '0.200', 'DAMAGECOUNT': '1.017', 'weapon2': '1.142', 'WEAPON3': '1.150', 'weapon3': '2.402', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:56:28,747][63806] DAMAGECOUNT value on done: 9434.0 +[2023-09-14 14:56:28,785][63767] DAMAGECOUNT value on done: 9977.0 +[2023-09-14 14:56:28,973][63769] DAMAGECOUNT value on done: 9342.0 +[2023-09-14 14:56:28,973][63769] Sum rewards: -1.064, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.261', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.028', 'WEAPON4': '0.050', 'AMMO3': '0.114', 'weapon4': '0.134', 'AMMO4': '0.138', 'WEAPON5': '0.200', 'weapon5': '0.246', 'HITCOUNT': '0.260', 'ARMOR': '0.440', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.765', 'FRAGCOUNT': '1.000', 'weapon3': '1.576', 'weapon2': '1.826'} +[2023-09-14 14:56:29,150][63767] DAMAGECOUNT value on done: 9339.0 +[2023-09-14 14:56:29,151][63767] Sum rewards: 2.088, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.200', 'AMMO5': '0.005', 'AMMO2': '0.007', 'AMMO4': '0.033', 'weapon5': '0.098', 'WEAPON5': '0.100', 'AMMO3': '0.101', 'weapon4': '0.174', 'WEAPON4': '0.200', 'ARMOR': '0.400', 'HITCOUNT': '0.420', 'WEAPON3': '0.700', 'weapon2': '1.284', 'weapon3': '1.668', 'DAMAGECOUNT': '1.848', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:56:29,338][63769] DAMAGECOUNT value on done: 8872.0 +[2023-09-14 14:56:29,339][63769] Sum rewards: -4.811, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.128', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.002', 'AMMO2': '-0.000', 'AMMO5': '0.014', 'ARMOR': '0.068', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.150', 'AMMO3': '0.156', 'weapon5': '0.156', 'weapon4': '0.268', 'WEAPON5': '0.300', 'HITCOUNT': '0.310', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.047', 'weapon2': '1.364', 'weapon3': '1.786'} +[2023-09-14 14:56:29,611][63735] DAMAGECOUNT value on done: 8938.0 +[2023-09-14 14:56:29,611][63735] Sum rewards: -1.449, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.660', 'AMMO2': '0.033', 'ARMOR': '0.072', 'AMMO3': '0.115', 'AMMO4': '0.167', 'WEAPON4': '0.200', 'HITCOUNT': '0.240', 'weapon4': '0.338', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.900', 'weapon3': '0.978', 'FRAGCOUNT': '1.000', 'weapon2': '2.168'} +[2023-09-14 14:56:29,929][63735] DAMAGECOUNT value on done: 6575.0 +[2023-09-14 14:56:29,929][63735] Sum rewards: -2.709, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.534', 'AMMO2': '0.005', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.027', 'weapon5': '0.028', 'AMMO3': '0.121', 'WEAPON5': '0.250', 'HITCOUNT': '0.260', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.975', 'weapon3': '1.742', 'weapon2': '1.744', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:56:30,202][63733] Updated weights for policy 1, policy_version 1590 (0.0011) +[2023-09-14 14:56:30,729][63805] DAMAGECOUNT value on done: 10768.0 +[2023-09-14 14:56:30,729][63805] Sum rewards: 1.332, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.760', 'AMMO2': '0.008', 'AMMO5': '0.012', 'weapon5': '0.016', 'WEAPON1': '0.030', 'ARMOR': '0.040', 'AMMO4': '0.041', 'WEAPON4': '0.050', 'AMMO3': '0.071', 'HITCOUNT': '0.120', 'weapon4': '0.134', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.375', 'WEAPON3': '0.500', 'weapon3': '1.350', 'weapon2': '1.694', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:56:31,136][63805] DAMAGECOUNT value on done: 7641.0 +[2023-09-14 14:56:31,136][63805] Sum rewards: -3.823, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.862', 'AMMO2': '0.007', 'AMMO5': '0.012', 'ARMOR': '0.024', 'AMMO4': '0.037', 'AMMO3': '0.127', 'weapon5': '0.128', 'HITCOUNT': '0.190', 'WEAPON5': '0.250', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.125', 'weapon2': '1.500', 'weapon3': '1.688'} +[2023-09-14 14:56:33,293][63769] DAMAGECOUNT value on done: 9467.0 +[2023-09-14 14:56:33,673][63769] DAMAGECOUNT value on done: 7368.0 +[2023-09-14 14:56:34,495][63770] DAMAGECOUNT value on done: 8109.0 +[2023-09-14 14:56:34,496][63770] Sum rewards: 0.245, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.984', 'AMMO2': '0.019', 'weapon4': '0.040', 'ARMOR': '0.068', 'AMMO4': '0.094', 'WEAPON4': '0.100', 'AMMO3': '0.154', 'HITCOUNT': '0.340', 'WEAPON3': '0.950', 'DAMAGECOUNT': '1.278', 'weapon2': '1.422', 'weapon3': '2.264', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:56:34,683][63732] Updated weights for policy 0, policy_version 1680 (0.0011) +[2023-09-14 14:56:34,952][63770] DAMAGECOUNT value on done: 8090.0 +[2023-09-14 14:56:34,953][63770] Sum rewards: -5.176, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.909', 'AMMO2': '0.008', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'AMMO4': '0.039', 'weapon4': '0.062', 'weapon5': '0.068', 'HITCOUNT': '0.080', 'ARMOR': '0.080', 'WEAPON4': '0.100', 'AMMO3': '0.161', 'DAMAGECOUNT': '0.240', 'WEAPON5': '0.250', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.490', 'weapon3': '1.872'} +[2023-09-14 14:56:36,222][63771] DAMAGECOUNT value on done: 7027.0 +[2023-09-14 14:56:36,223][63771] Sum rewards: -1.728, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.405', 'AMMO4': '-0.074', 'AMMO2': '-0.015', 'AMMO5': '0.006', 'WEAPON4': '0.100', 'AMMO3': '0.121', 'weapon5': '0.142', 'WEAPON5': '0.150', 'weapon4': '0.196', 'HITCOUNT': '0.330', 'ARMOR': '0.489', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.950', 'weapon2': '1.246', 'DAMAGECOUNT': '1.392', 'weapon3': '1.894'} +[2023-09-14 14:56:36,558][63771] DAMAGECOUNT value on done: 9774.0 +[2023-09-14 14:56:36,559][63771] Sum rewards: 4.506, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.812', 'AMMO2': '0.001', 'AMMO4': '0.002', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'ARMOR': '0.036', 'weapon7': '0.062', 'AMMO3': '0.096', 'WEAPON5': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON7': '0.200', 'HITCOUNT': '0.310', 'WEAPON3': '0.550', 'weapon2': '1.462', 'weapon3': '1.604', 'DAMAGECOUNT': '1.890', 'FRAGCOUNT': '7.000'} +[2023-09-14 14:56:37,471][63454] Saving new best policy, reward=-2.096! +[2023-09-14 14:56:37,927][63767] DAMAGECOUNT value on done: 10782.0 +[2023-09-14 14:56:37,927][63767] Sum rewards: 0.319, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.932', 'AMMO2': '0.004', 'AMMO5': '0.009', 'AMMO4': '0.018', 'WEAPON1': '0.020', 'weapon7': '0.048', 'WEAPON4': '0.050', 'AMMO3': '0.072', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon4': '0.158', 'WEAPON7': '0.200', 'WEAPON5': '0.250', 'HITCOUNT': '0.260', 'weapon5': '0.310', 'ARMOR': '0.479', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.164', 'weapon2': '1.204', 'weapon3': '1.214'} +[2023-09-14 14:56:38,087][63733] Updated weights for policy 1, policy_version 1600 (0.0011) +[2023-09-14 14:56:38,267][63767] DAMAGECOUNT value on done: 12272.0 +[2023-09-14 14:56:38,267][63767] Sum rewards: -2.446, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.778', 'AMMO2': '0.015', 'AMMO5': '0.020', 'ARMOR': '0.040', 'AMMO4': '0.074', 'WEAPON4': '0.100', 'weapon5': '0.114', 'AMMO3': '0.123', 'weapon4': '0.204', 'HITCOUNT': '0.260', 'WEAPON5': '0.350', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.206', 'weapon2': '1.358', 'weapon3': '1.618', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:56:41,061][63732] Updated weights for policy 0, policy_version 1690 (0.0011) +[2023-09-14 14:56:41,760][63806] DAMAGECOUNT value on done: 9433.0 +[2023-09-14 14:56:41,761][63806] Sum rewards: -4.980, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.854', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.022', 'AMMO2': '-0.004', 'AMMO5': '0.005', 'ARMOR': '0.036', 'HITCOUNT': '0.070', 'weapon5': '0.076', 'WEAPON5': '0.100', 'AMMO3': '0.157', 'DAMAGECOUNT': '0.360', 'WEAPON3': '0.750', 'weapon2': '1.410', 'weapon3': '1.936'} +[2023-09-14 14:56:41,779][63805] DAMAGECOUNT value on done: 10217.0 +[2023-09-14 14:56:41,779][63805] Sum rewards: 0.853, reward structure: {'DEATHCOUNT': '-5.250', 'WEAPON1': '0.010', 'AMMO5': '0.017', 'AMMO2': '0.027', 'AMMO3': '0.092', 'HITCOUNT': '0.130', 'AMMO4': '0.135', 'WEAPON5': '0.300', 'weapon5': '0.308', 'DAMAGECOUNT': '0.357', 'WEAPON3': '0.400', 'HEALTH': '0.498', 'FRAGCOUNT': '1.000', 'weapon2': '1.190', 'weapon3': '1.638'} +[2023-09-14 14:56:42,071][63806] DAMAGECOUNT value on done: 8699.0 +[2023-09-14 14:56:42,120][63805] DAMAGECOUNT value on done: 10478.0 +[2023-09-14 14:56:42,120][63805] Sum rewards: -8.578, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.058', 'AMMO2': '0.007', 'ARMOR': '0.016', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'AMMO4': '0.034', 'weapon4': '0.078', 'AMMO3': '0.115', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'WEAPON5': '0.300', 'weapon5': '0.434', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.501', 'WEAPON3': '0.700', 'weapon3': '1.222', 'weapon2': '1.986'} +[2023-09-14 14:56:42,462][63454] Saving new best policy, reward=-2.017! +[2023-09-14 14:56:43,540][63771] DAMAGECOUNT value on done: 10180.0 +[2023-09-14 14:56:43,540][63771] Sum rewards: -4.373, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.157', 'AMMO4': '-0.046', 'AMMO2': '-0.009', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'ARMOR': '0.020', 'weapon5': '0.072', 'AMMO3': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.210', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.654', 'FRAGCOUNT': '1.000', 'weapon3': '1.548', 'weapon2': '1.820'} +[2023-09-14 14:56:43,926][63771] DAMAGECOUNT value on done: 7333.0 +[2023-09-14 14:56:43,927][63771] Sum rewards: -3.539, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.300', 'AMMO2': '0.017', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'HITCOUNT': '0.080', 'AMMO4': '0.086', 'AMMO3': '0.106', 'WEAPON4': '0.150', 'weapon4': '0.268', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.268', 'weapon2': '1.974'} +[2023-09-14 14:56:46,190][63733] Updated weights for policy 1, policy_version 1610 (0.0010) +[2023-09-14 14:56:47,499][63732] Updated weights for policy 0, policy_version 1700 (0.0010) +[2023-09-14 14:56:48,374][63770] DAMAGECOUNT value on done: 10706.0 +[2023-09-14 14:56:48,375][63770] Sum rewards: -2.738, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-0.500', 'HEALTH': '-0.214', 'AMMO2': '0.013', 'AMMO5': '0.015', 'ARMOR': '0.049', 'AMMO4': '0.064', 'AMMO3': '0.090', 'WEAPON4': '0.150', 'HITCOUNT': '0.160', 'weapon5': '0.240', 'WEAPON5': '0.250', 'weapon4': '0.256', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.531', 'weapon3': '1.442', 'weapon2': '1.716'} +[2023-09-14 14:56:48,820][63770] DAMAGECOUNT value on done: 7632.0 +[2023-09-14 14:56:50,156][63734] DAMAGECOUNT value on done: 9722.0 +[2023-09-14 14:56:50,157][63734] Sum rewards: -4.873, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.282', 'AMMO4': '-0.027', 'AMMO2': '-0.005', 'AMMO5': '0.011', 'ARMOR': '0.016', 'weapon5': '0.126', 'HITCOUNT': '0.140', 'AMMO3': '0.197', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.687', 'WEAPON3': '0.950', 'weapon2': '1.364', 'FRAGCOUNT': '2.000', 'weapon3': '2.200'} +[2023-09-14 14:56:50,379][63735] DAMAGECOUNT value on done: 8998.0 +[2023-09-14 14:56:50,379][63735] Sum rewards: -5.852, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.575', 'AMMO5': '0.005', 'AMMO2': '0.007', 'AMMO4': '0.034', 'WEAPON5': '0.050', 'ARMOR': '0.088', 'WEAPON4': '0.100', 'HITCOUNT': '0.140', 'AMMO3': '0.147', 'weapon4': '0.198', 'DAMAGECOUNT': '0.516', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon3': '1.380', 'weapon2': '1.958'} +[2023-09-14 14:56:50,481][63734] DAMAGECOUNT value on done: 9302.0 +[2023-09-14 14:56:50,482][63734] Sum rewards: 1.310, reward structure: {'DEATHCOUNT': '-5.250', 'AMMO5': '0.013', 'weapon4': '0.022', 'AMMO2': '0.024', 'weapon5': '0.042', 'WEAPON4': '0.050', 'HEALTH': '0.064', 'AMMO3': '0.093', 'AMMO4': '0.118', 'WEAPON5': '0.150', 'HITCOUNT': '0.200', 'ARMOR': '0.536', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.717', 'FRAGCOUNT': '1.000', 'weapon3': '1.430', 'weapon2': '1.552'} +[2023-09-14 14:56:50,786][63735] DAMAGECOUNT value on done: 10720.0 +[2023-09-14 14:56:50,786][63735] Sum rewards: -1.223, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.202', 'AMMO2': '0.007', 'AMMO5': '0.019', 'AMMO4': '0.035', 'weapon4': '0.110', 'AMMO3': '0.127', 'WEAPON4': '0.200', 'HITCOUNT': '0.340', 'weapon5': '0.344', 'WEAPON5': '0.350', 'WEAPON3': '0.850', 'ARMOR': '0.924', 'weapon3': '1.350', 'DAMAGECOUNT': '1.872', 'weapon2': '1.950', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:56:51,632][63767] DAMAGECOUNT value on done: 10362.0 +[2023-09-14 14:56:51,632][63767] Sum rewards: 1.111, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.381', 'AMMO2': '0.011', 'ARMOR': '0.032', 'AMMO4': '0.057', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON4': '0.100', 'weapon7': '0.100', 'AMMO3': '0.175', 'weapon4': '0.248', 'HITCOUNT': '0.300', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.155', 'weapon2': '1.712', 'weapon3': '1.752', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:56:51,863][63735] DAMAGECOUNT value on done: 9072.0 +[2023-09-14 14:56:51,864][63735] Sum rewards: 0.094, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.724', 'AMMO4': '-0.031', 'AMMO2': '-0.006', 'AMMO5': '0.005', 'AMMO3': '0.054', 'weapon5': '0.062', 'WEAPON5': '0.100', 'HITCOUNT': '0.130', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.402', 'weapon3': '1.110', 'weapon2': '1.842', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:56:52,042][63767] DAMAGECOUNT value on done: 9484.0 +[2023-09-14 14:56:52,196][63769] DAMAGECOUNT value on done: 9482.0 +[2023-09-14 14:56:52,197][63769] Sum rewards: -4.544, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.024', 'WEAPON1': '0.010', 'AMMO5': '0.020', 'AMMO2': '0.033', 'ARMOR': '0.036', 'HITCOUNT': '0.100', 'AMMO3': '0.130', 'AMMO4': '0.165', 'weapon5': '0.172', 'weapon4': '0.178', 'WEAPON4': '0.200', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.420', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.850', 'weapon2': '1.346', 'weapon3': '1.920'} +[2023-09-14 14:56:52,280][63735] DAMAGECOUNT value on done: 6925.0 +[2023-09-14 14:56:52,280][63735] Sum rewards: -1.649, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.949', 'AMMO2': '0.001', 'AMMO4': '0.004', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'weapon5': '0.016', 'ARMOR': '0.068', 'AMMO3': '0.092', 'WEAPON5': '0.100', 'HITCOUNT': '0.250', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.050', 'weapon2': '1.438', 'FRAGCOUNT': '1.500', 'weapon3': '1.666'} +[2023-09-14 14:56:52,462][63454] Saving new best policy, reward=-1.873! +[2023-09-14 14:56:52,555][63769] DAMAGECOUNT value on done: 9071.0 +[2023-09-14 14:56:52,693][63806] DAMAGECOUNT value on done: 7635.0 +[2023-09-14 14:56:52,693][63806] Sum rewards: -0.864, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.663', 'AMMO2': '0.006', 'AMMO5': '0.007', 'AMMO4': '0.029', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'weapon7': '0.080', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon5': '0.104', 'AMMO3': '0.122', 'WEAPON5': '0.150', 'weapon4': '0.204', 'HITCOUNT': '0.230', 'weapon2': '0.776', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.861', 'weapon3': '2.048', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:56:53,057][63806] DAMAGECOUNT value on done: 9519.0 +[2023-09-14 14:56:53,057][63806] Sum rewards: -2.024, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.708', 'AMMO5': '0.003', 'AMMO2': '0.007', 'weapon5': '0.014', 'AMMO4': '0.033', 'WEAPON5': '0.050', 'ARMOR': '0.063', 'HITCOUNT': '0.070', 'AMMO3': '0.074', 'WEAPON4': '0.100', 'weapon4': '0.224', 'DAMAGECOUNT': '0.255', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.312', 'weapon2': '1.730'} +[2023-09-14 14:56:53,201][63805] DAMAGECOUNT value on done: 10783.0 +[2023-09-14 14:56:53,245][63734] DAMAGECOUNT value on done: 8940.0 +[2023-09-14 14:56:53,245][63734] Sum rewards: -6.650, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.842', 'FRAGCOUNT': '-0.500', 'weapon4': '0.004', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO2': '0.017', 'ARMOR': '0.052', 'AMMO4': '0.086', 'WEAPON4': '0.100', 'weapon5': '0.146', 'AMMO3': '0.163', 'HITCOUNT': '0.170', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.549', 'WEAPON3': '0.750', 'weapon2': '1.574', 'weapon3': '2.058'} +[2023-09-14 14:56:53,518][63805] DAMAGECOUNT value on done: 7958.0 +[2023-09-14 14:56:53,518][63805] Sum rewards: -4.586, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.968', 'AMMO2': '0.000', 'AMMO4': '0.001', 'AMMO5': '0.015', 'weapon5': '0.042', 'ARMOR': '0.056', 'AMMO3': '0.170', 'WEAPON5': '0.200', 'HITCOUNT': '0.270', 'DAMAGECOUNT': '0.951', 'WEAPON3': '1.000', 'weapon2': '1.550', 'weapon3': '1.626', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:56:53,571][63734] DAMAGECOUNT value on done: 7125.0 +[2023-09-14 14:56:53,572][63734] Sum rewards: -0.477, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.418', 'AMMO2': '0.015', 'AMMO4': '0.075', 'WEAPON4': '0.100', 'AMMO3': '0.110', 'ARMOR': '0.116', 'weapon4': '0.128', 'HITCOUNT': '0.320', 'WEAPON3': '0.450', 'DAMAGECOUNT': '1.149', 'weapon3': '1.206', 'weapon2': '2.022', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:56:53,834][63732] Updated weights for policy 0, policy_version 1710 (0.0011) +[2023-09-14 14:56:54,664][63733] Updated weights for policy 1, policy_version 1620 (0.0011) +[2023-09-14 14:56:57,466][63454] Saving new best policy, reward=-1.831! +[2023-09-14 14:56:58,155][63769] DAMAGECOUNT value on done: 9777.0 +[2023-09-14 14:56:58,156][63769] Sum rewards: -2.985, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.888', 'weapon7': '0.004', 'AMMO5': '0.015', 'weapon5': '0.028', 'AMMO2': '0.029', 'ARMOR': '0.040', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.139', 'weapon4': '0.140', 'AMMO4': '0.142', 'WEAPON5': '0.200', 'HITCOUNT': '0.250', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.930', 'WEAPON3': '0.950', 'weapon2': '1.350', 'weapon3': '2.086', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:56:58,623][63769] DAMAGECOUNT value on done: 7443.0 +[2023-09-14 14:56:58,623][63769] Sum rewards: -5.758, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.272', 'AMMO5': '0.003', 'AMMO2': '0.012', 'weapon5': '0.026', 'WEAPON5': '0.050', 'ARMOR': '0.059', 'AMMO4': '0.059', 'HITCOUNT': '0.070', 'AMMO3': '0.140', 'DAMAGECOUNT': '0.225', 'WEAPON4': '0.250', 'weapon4': '0.344', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.092', 'weapon3': '1.884'} +[2023-09-14 14:56:59,622][63771] DAMAGECOUNT value on done: 7454.0 +[2023-09-14 14:56:59,622][63771] Sum rewards: 1.036, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.984', 'WEAPON1': '0.020', 'AMMO2': '0.020', 'AMMO5': '0.023', 'weapon5': '0.080', 'ARMOR': '0.088', 'AMMO4': '0.100', 'AMMO3': '0.125', 'weapon4': '0.180', 'WEAPON4': '0.200', 'WEAPON5': '0.350', 'HITCOUNT': '0.360', 'WEAPON3': '0.800', 'weapon2': '1.250', 'DAMAGECOUNT': '1.281', 'weapon3': '2.144', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:56:59,789][63732] Updated weights for policy 0, policy_version 1720 (0.0011) +[2023-09-14 14:56:59,942][63770] DAMAGECOUNT value on done: 8490.0 +[2023-09-14 14:56:59,942][63770] Sum rewards: 0.728, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.412', 'AMMO2': '0.007', 'AMMO5': '0.017', 'AMMO4': '0.033', 'ARMOR': '0.036', 'weapon5': '0.076', 'AMMO3': '0.184', 'WEAPON5': '0.300', 'HITCOUNT': '0.330', 'WEAPON3': '1.000', 'DAMAGECOUNT': '1.143', 'weapon2': '1.540', 'weapon3': '2.224', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:57:00,024][63771] DAMAGECOUNT value on done: 10151.0 +[2023-09-14 14:57:00,025][63771] Sum rewards: -0.832, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.789', 'AMMO2': '0.006', 'AMMO5': '0.028', 'AMMO4': '0.028', 'ARMOR': '0.040', 'AMMO3': '0.144', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'weapon5': '0.282', 'weapon4': '0.374', 'WEAPON5': '0.550', 'WEAPON3': '0.800', 'weapon2': '1.050', 'DAMAGECOUNT': '1.131', 'weapon3': '1.854', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:57:00,407][63770] DAMAGECOUNT value on done: 8110.0 +[2023-09-14 14:57:00,839][63767] DAMAGECOUNT value on done: 10909.0 +[2023-09-14 14:57:00,840][63767] Sum rewards: -1.698, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.974', 'AMMO2': '0.013', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'AMMO4': '0.062', 'WEAPON4': '0.100', 'HITCOUNT': '0.130', 'AMMO3': '0.149', 'weapon4': '0.162', 'weapon5': '0.256', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.381', 'ARMOR': '0.404', 'WEAPON3': '0.950', 'weapon2': '1.090', 'weapon3': '2.192', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:57:01,250][63767] DAMAGECOUNT value on done: 12499.0 +[2023-09-14 14:57:01,251][63767] Sum rewards: 4.713, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.047', 'AMMO5': '0.007', 'weapon5': '0.034', 'AMMO2': '0.037', 'AMMO3': '0.083', 'WEAPON5': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon7': '0.126', 'HITCOUNT': '0.140', 'WEAPON4': '0.150', 'AMMO4': '0.183', 'WEAPON7': '0.200', 'weapon4': '0.268', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.681', 'ARMOR': '0.836', 'weapon2': '1.268', 'weapon3': '1.456', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:57:02,461][63454] Saving new best policy, reward=-1.587! +[2023-09-14 14:57:03,658][63806] DAMAGECOUNT value on done: 9583.0 +[2023-09-14 14:57:03,659][63806] Sum rewards: -2.526, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.232', 'AMMO2': '0.003', 'AMMO5': '0.013', 'AMMO4': '0.016', 'WEAPON1': '0.020', 'weapon5': '0.036', 'weapon4': '0.044', 'ARMOR': '0.076', 'AMMO3': '0.088', 'WEAPON4': '0.100', 'HITCOUNT': '0.130', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.048', 'weapon2': '2.332'} +[2023-09-14 14:57:03,983][63806] DAMAGECOUNT value on done: 8925.0 +[2023-09-14 14:57:03,984][63806] Sum rewards: -3.201, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.615', 'AMMO2': '0.006', 'WEAPON1': '0.010', 'AMMO5': '0.019', 'ARMOR': '0.024', 'AMMO4': '0.029', 'WEAPON4': '0.050', 'weapon5': '0.066', 'AMMO3': '0.129', 'HITCOUNT': '0.190', 'weapon4': '0.206', 'WEAPON5': '0.300', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.678', 'WEAPON3': '0.800', 'weapon2': '1.016', 'weapon3': '1.890'} +[2023-09-14 14:57:04,198][63733] Updated weights for policy 1, policy_version 1630 (0.0011) +[2023-09-14 14:57:05,050][63805] DAMAGECOUNT value on done: 10497.0 +[2023-09-14 14:57:05,050][63805] Sum rewards: -1.902, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.410', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'AMMO2': '0.026', 'weapon5': '0.054', 'weapon7': '0.096', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.114', 'AMMO4': '0.129', 'WEAPON4': '0.200', 'weapon4': '0.230', 'HITCOUNT': '0.240', 'DAMAGECOUNT': '0.840', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.236', 'weapon3': '1.794'} +[2023-09-14 14:57:05,352][63805] DAMAGECOUNT value on done: 10838.0 +[2023-09-14 14:57:05,352][63805] Sum rewards: 0.579, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.230', 'AMMO5': '0.020', 'ARMOR': '0.032', 'AMMO2': '0.038', 'weapon4': '0.056', 'WEAPON4': '0.100', 'AMMO3': '0.156', 'AMMO4': '0.187', 'weapon5': '0.284', 'HITCOUNT': '0.290', 'WEAPON5': '0.300', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.080', 'weapon2': '1.416', 'weapon3': '1.950', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:57:05,625][63732] Updated weights for policy 0, policy_version 1730 (0.0011) +[2023-09-14 14:57:06,391][63771] DAMAGECOUNT value on done: 10499.0 +[2023-09-14 14:57:06,392][63771] Sum rewards: -2.698, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.632', 'AMMO2': '0.001', 'AMMO4': '0.002', 'AMMO5': '0.014', 'WEAPON4': '0.050', 'AMMO3': '0.077', 'weapon4': '0.100', 'weapon5': '0.156', 'HITCOUNT': '0.190', 'WEAPON5': '0.350', 'ARMOR': '0.400', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.957', 'weapon3': '1.114', 'weapon2': '1.972'} +[2023-09-14 14:57:06,725][63771] DAMAGECOUNT value on done: 7588.0 +[2023-09-14 14:57:06,725][63771] Sum rewards: -0.021, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.097', 'WEAPON1': '0.010', 'AMMO2': '0.034', 'AMMO3': '0.069', 'AMMO4': '0.171', 'HITCOUNT': '0.200', 'weapon4': '0.258', 'WEAPON4': '0.350', 'ARMOR': '0.404', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.765', 'weapon3': '0.994', 'weapon2': '1.870', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:57:11,449][63732] Updated weights for policy 0, policy_version 1740 (0.0011) +[2023-09-14 14:57:13,723][63733] Updated weights for policy 1, policy_version 1640 (0.0010) +[2023-09-14 14:57:13,794][63770] DAMAGECOUNT value on done: 11110.0 +[2023-09-14 14:57:13,795][63770] Sum rewards: 1.927, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.650', 'AMMO5': '0.010', 'AMMO2': '0.016', 'weapon4': '0.050', 'AMMO4': '0.080', 'AMMO3': '0.110', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'weapon5': '0.228', 'HITCOUNT': '0.340', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.212', 'weapon2': '1.302', 'weapon3': '2.028', 'FRAGCOUNT': '6.000'} +[2023-09-14 14:57:13,909][63734] DAMAGECOUNT value on done: 9780.0 +[2023-09-14 14:57:14,136][63770] DAMAGECOUNT value on done: 7760.0 +[2023-09-14 14:57:14,305][63734] DAMAGECOUNT value on done: 9506.0 +[2023-09-14 14:57:14,305][63734] Sum rewards: -4.681, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.607', 'AMMO2': '0.014', 'AMMO5': '0.018', 'ARMOR': '0.028', 'weapon5': '0.034', 'WEAPON4': '0.050', 'AMMO4': '0.072', 'weapon4': '0.116', 'AMMO3': '0.194', 'WEAPON5': '0.200', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.612', 'WEAPON3': '1.100', 'weapon2': '1.444', 'weapon3': '2.084', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:57:14,914][63767] DAMAGECOUNT value on done: 10734.0 +[2023-09-14 14:57:14,914][63767] Sum rewards: 0.014, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.794', 'AMMO2': '0.002', 'AMMO4': '0.009', 'AMMO5': '0.013', 'ARMOR': '0.080', 'AMMO3': '0.084', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon7': '0.120', 'weapon5': '0.124', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'weapon4': '0.308', 'HITCOUNT': '0.330', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.116', 'weapon2': '1.212', 'weapon3': '1.710', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:57:15,287][63767] DAMAGECOUNT value on done: 9859.0 +[2023-09-14 14:57:15,288][63767] Sum rewards: -4.166, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.625', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.010', 'AMMO2': '0.023', 'WEAPON1': '0.030', 'ARMOR': '0.056', 'AMMO4': '0.117', 'AMMO3': '0.138', 'weapon5': '0.150', 'WEAPON5': '0.200', 'weapon4': '0.238', 'WEAPON4': '0.250', 'HITCOUNT': '0.320', 'WEAPON3': '0.850', 'weapon2': '0.966', 'DAMAGECOUNT': '1.125', 'weapon3': '2.236'} +[2023-09-14 14:57:15,480][63735] DAMAGECOUNT value on done: 9092.0 +[2023-09-14 14:57:15,555][63805] DAMAGECOUNT value on done: 11093.0 +[2023-09-14 14:57:15,556][63805] Sum rewards: -2.355, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.052', 'AMMO5': '0.003', 'ARMOR': '0.004', 'WEAPON1': '0.010', 'weapon5': '0.022', 'AMMO2': '0.030', 'WEAPON4': '0.050', 'WEAPON5': '0.050', 'AMMO3': '0.122', 'AMMO4': '0.149', 'weapon4': '0.152', 'HITCOUNT': '0.270', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.930', 'FRAGCOUNT': '1.000', 'weapon2': '1.610', 'weapon3': '1.796'} +[2023-09-14 14:57:15,866][63805] DAMAGECOUNT value on done: 8098.0 +[2023-09-14 14:57:15,866][63805] Sum rewards: -1.402, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.438', 'AMMO5': '0.003', 'AMMO2': '0.021', 'WEAPON5': '0.050', 'HITCOUNT': '0.080', 'AMMO3': '0.087', 'ARMOR': '0.088', 'AMMO4': '0.105', 'WEAPON4': '0.200', 'weapon4': '0.368', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.450', 'FRAGCOUNT': '1.000', 'weapon3': '1.150', 'weapon2': '1.764'} +[2023-09-14 14:57:15,882][63735] DAMAGECOUNT value on done: 10966.0 +[2023-09-14 14:57:15,882][63735] Sum rewards: -5.230, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.147', 'AMMO5': '0.015', 'AMMO2': '0.019', 'ARMOR': '0.024', 'AMMO4': '0.094', 'weapon4': '0.128', 'AMMO3': '0.143', 'HITCOUNT': '0.180', 'weapon5': '0.186', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon7': '0.234', 'AMMO6': '0.300', 'WEAPON7': '0.300', 'AMMO7': '0.300', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.738', 'FRAGCOUNT': '1.000', 'weapon3': '1.568', 'weapon2': '1.638'} +[2023-09-14 14:57:16,130][63769] DAMAGECOUNT value on done: 10022.0 +[2023-09-14 14:57:16,131][63769] Sum rewards: -2.568, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.120', 'AMMO5': '0.013', 'weapon5': '0.014', 'AMMO2': '0.018', 'ARMOR': '0.052', 'AMMO4': '0.090', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.171', 'weapon4': '0.302', 'HITCOUNT': '0.380', 'WEAPON3': '1.050', 'weapon2': '1.212', 'DAMAGECOUNT': '1.620', 'weapon3': '1.930', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:57:16,542][63769] DAMAGECOUNT value on done: 9242.0 +[2023-09-14 14:57:16,934][63735] DAMAGECOUNT value on done: 9426.0 +[2023-09-14 14:57:16,934][63735] Sum rewards: -0.652, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.090', 'AMMO5': '0.015', 'ARMOR': '0.036', 'AMMO2': '0.040', 'AMMO3': '0.093', 'AMMO4': '0.198', 'WEAPON5': '0.250', 'weapon5': '0.266', 'HITCOUNT': '0.370', 'WEAPON4': '0.450', 'WEAPON3': '0.450', 'weapon4': '0.570', 'DAMAGECOUNT': '1.062', 'weapon3': '1.190', 'weapon2': '1.448', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:57:16,935][63806] DAMAGECOUNT value on done: 8172.0 +[2023-09-14 14:57:16,936][63806] Sum rewards: -1.257, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.915', 'AMMO5': '0.026', 'AMMO2': '0.030', 'ARMOR': '0.060', 'AMMO3': '0.113', 'AMMO4': '0.148', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'weapon4': '0.428', 'WEAPON5': '0.500', 'weapon5': '0.578', 'WEAPON3': '0.750', 'weapon3': '1.250', 'weapon2': '1.494', 'DAMAGECOUNT': '1.611', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:57:16,987][63734] DAMAGECOUNT value on done: 9335.0 +[2023-09-14 14:57:16,987][63734] Sum rewards: -7.574, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-4.260', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'AMMO2': '0.035', 'weapon5': '0.068', 'ARMOR': '0.092', 'WEAPON5': '0.100', 'AMMO3': '0.145', 'AMMO4': '0.172', 'HITCOUNT': '0.320', 'weapon4': '0.322', 'WEAPON4': '0.500', 'WEAPON3': '1.050', 'DAMAGECOUNT': '1.185', 'weapon2': '1.544', 'weapon3': '1.878', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:57:17,314][63735] DAMAGECOUNT value on done: 7505.0 +[2023-09-14 14:57:17,314][63735] Sum rewards: 0.684, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.725', 'AMMO2': '0.003', 'AMMO5': '0.007', 'AMMO4': '0.016', 'weapon5': '0.022', 'AMMO3': '0.109', 'WEAPON5': '0.150', 'weapon4': '0.186', 'WEAPON4': '0.250', 'ARMOR': '0.465', 'HITCOUNT': '0.490', 'WEAPON3': '0.750', 'weapon3': '1.714', 'DAMAGECOUNT': '1.740', 'weapon2': '1.756', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:57:17,324][63806] DAMAGECOUNT value on done: 9667.0 +[2023-09-14 14:57:17,337][63734] DAMAGECOUNT value on done: 7325.0 +[2023-09-14 14:57:17,338][63734] Sum rewards: -1.173, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.842', 'AMMO5': '0.010', 'AMMO2': '0.018', 'weapon5': '0.026', 'AMMO4': '0.089', 'AMMO3': '0.138', 'HITCOUNT': '0.180', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.462', 'ARMOR': '0.504', 'DAMAGECOUNT': '0.600', 'weapon2': '0.692', 'WEAPON3': '0.900', 'weapon3': '1.900', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:57:17,605][63732] Updated weights for policy 0, policy_version 1750 (0.0010) +[2023-09-14 14:57:21,463][63733] Updated weights for policy 1, policy_version 1650 (0.0012) +[2023-09-14 14:57:23,099][63771] DAMAGECOUNT value on done: 7980.0 +[2023-09-14 14:57:23,100][63771] Sum rewards: -1.578, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.150', 'WEAPON1': '0.010', 'AMMO2': '0.019', 'AMMO5': '0.019', 'AMMO4': '0.094', 'AMMO3': '0.134', 'weapon4': '0.204', 'HITCOUNT': '0.250', 'WEAPON4': '0.300', 'WEAPON5': '0.350', 'weapon5': '0.426', 'WEAPON3': '0.700', 'weapon2': '1.330', 'FRAGCOUNT': '1.500', 'DAMAGECOUNT': '1.578', 'weapon3': '1.658'} +[2023-09-14 14:57:23,436][63769] DAMAGECOUNT value on done: 10311.0 +[2023-09-14 14:57:23,436][63769] Sum rewards: 2.870, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.070', 'AMMO2': '0.012', 'ARMOR': '0.054', 'AMMO4': '0.057', 'weapon7': '0.070', 'AMMO3': '0.115', 'WEAPON4': '0.200', 'weapon4': '0.220', 'AMMO6': '0.300', 'WEAPON7': '0.300', 'AMMO7': '0.300', 'HITCOUNT': '0.330', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.602', 'weapon3': '1.712', 'weapon2': '1.718', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:57:23,488][63771] DAMAGECOUNT value on done: 10374.0 +[2023-09-14 14:57:23,489][63771] Sum rewards: 1.157, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.307', 'AMMO2': '0.001', 'AMMO4': '0.004', 'AMMO5': '0.007', 'AMMO3': '0.092', 'weapon5': '0.120', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'WEAPON3': '0.350', 'ARMOR': '0.420', 'DAMAGECOUNT': '0.669', 'weapon3': '1.534', 'weapon2': '1.966', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:57:23,761][63767] DAMAGECOUNT value on done: 11259.0 +[2023-09-14 14:57:23,762][63767] Sum rewards: -3.560, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.266', 'WEAPON1': '0.010', 'AMMO2': '0.022', 'AMMO5': '0.025', 'AMMO3': '0.089', 'ARMOR': '0.106', 'AMMO4': '0.108', 'weapon5': '0.154', 'HITCOUNT': '0.210', 'WEAPON4': '0.300', 'WEAPON5': '0.350', 'FRAGCOUNT': '0.500', 'weapon4': '0.508', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.050', 'weapon2': '1.306', 'weapon3': '1.368'} +[2023-09-14 14:57:23,814][63769] DAMAGECOUNT value on done: 7475.0 +[2023-09-14 14:57:24,144][63767] DAMAGECOUNT value on done: 13054.0 +[2023-09-14 14:57:24,144][63767] Sum rewards: -0.961, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.442', 'AMMO5': '0.005', 'AMMO2': '0.010', 'AMMO4': '0.048', 'weapon7': '0.060', 'ARMOR': '0.092', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.151', 'WEAPON7': '0.200', 'WEAPON4': '0.250', 'HITCOUNT': '0.440', 'weapon4': '0.492', 'WEAPON3': '0.800', 'weapon2': '0.842', 'weapon3': '1.436', 'DAMAGECOUNT': '1.665', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:57:24,886][63732] Updated weights for policy 0, policy_version 1760 (0.0011) +[2023-09-14 14:57:25,393][63770] DAMAGECOUNT value on done: 8683.0 +[2023-09-14 14:57:25,394][63770] Sum rewards: 2.286, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.615', 'AMMO5': '0.003', 'AMMO2': '0.009', 'AMMO3': '0.040', 'AMMO4': '0.043', 'WEAPON5': '0.050', 'weapon5': '0.060', 'HITCOUNT': '0.200', 'WEAPON4': '0.250', 'WEAPON3': '0.250', 'weapon4': '0.466', 'DAMAGECOUNT': '0.579', 'ARMOR': '0.580', 'weapon3': '0.802', 'weapon2': '1.070', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:57:25,757][63770] DAMAGECOUNT value on done: 8379.0 +[2023-09-14 14:57:25,758][63770] Sum rewards: -2.863, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.558', 'AMMO5': '0.005', 'weapon5': '0.006', 'AMMO2': '0.007', 'ARMOR': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.033', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.124', 'AMMO3': '0.141', 'HITCOUNT': '0.220', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.807', 'weapon2': '1.702', 'weapon3': '1.768', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:57:26,055][63806] DAMAGECOUNT value on done: 9737.0 +[2023-09-14 14:57:26,356][63806] DAMAGECOUNT value on done: 9100.0 +[2023-09-14 14:57:28,128][63805] DAMAGECOUNT value on done: 10537.0 +[2023-09-14 14:57:28,519][63805] DAMAGECOUNT value on done: 11289.0 +[2023-09-14 14:57:28,519][63805] Sum rewards: -0.565, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.406', 'WEAPON1': '0.010', 'AMMO2': '0.019', 'AMMO5': '0.026', 'ARMOR': '0.072', 'AMMO4': '0.096', 'AMMO3': '0.110', 'WEAPON4': '0.250', 'HITCOUNT': '0.250', 'weapon4': '0.412', 'weapon5': '0.444', 'WEAPON5': '0.450', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.600', 'weapon3': '1.248', 'DAMAGECOUNT': '1.353', 'weapon2': '1.500'} +[2023-09-14 14:57:28,636][63733] Updated weights for policy 1, policy_version 1660 (0.0011) +[2023-09-14 14:57:29,103][63771] DAMAGECOUNT value on done: 10532.0 +[2023-09-14 14:57:29,529][63771] DAMAGECOUNT value on done: 7732.0 +[2023-09-14 14:57:29,530][63771] Sum rewards: -1.461, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.356', 'AMMO2': '0.004', 'AMMO5': '0.014', 'WEAPON1': '0.020', 'AMMO4': '0.020', 'WEAPON4': '0.050', 'HITCOUNT': '0.080', 'AMMO3': '0.090', 'weapon4': '0.146', 'weapon5': '0.152', 'WEAPON3': '0.300', 'WEAPON5': '0.300', 'weapon3': '0.314', 'DAMAGECOUNT': '0.432', 'ARMOR': '0.940', 'FRAGCOUNT': '2.000', 'weapon2': '2.532'} +[2023-09-14 14:57:32,052][63732] Updated weights for policy 0, policy_version 1770 (0.0011) +[2023-09-14 14:57:35,985][63733] Updated weights for policy 1, policy_version 1670 (0.0011) +[2023-09-14 14:57:37,203][63734] DAMAGECOUNT value on done: 9977.0 +[2023-09-14 14:57:37,204][63734] Sum rewards: -1.565, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.370', 'AMMO4': '-0.004', 'AMMO2': '-0.001', 'AMMO5': '0.003', 'WEAPON1': '0.020', 'WEAPON5': '0.050', 'weapon4': '0.062', 'weapon5': '0.072', 'AMMO3': '0.088', 'WEAPON4': '0.100', 'HITCOUNT': '0.180', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.591', 'FRAGCOUNT': '1.000', 'weapon3': '1.096', 'weapon2': '2.098'} +[2023-09-14 14:57:37,509][63767] DAMAGECOUNT value on done: 10841.0 +[2023-09-14 14:57:37,618][63734] DAMAGECOUNT value on done: 9750.0 +[2023-09-14 14:57:37,618][63734] Sum rewards: -7.249, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.562', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.014', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'AMMO4': '0.070', 'weapon5': '0.072', 'AMMO3': '0.080', 'weapon4': '0.098', 'HITCOUNT': '0.170', 'WEAPON4': '0.200', 'WEAPON5': '0.300', 'WEAPON3': '0.450', 'ARMOR': '0.534', 'DAMAGECOUNT': '0.732', 'weapon3': '1.314', 'weapon2': '1.990'} +[2023-09-14 14:57:37,836][63767] DAMAGECOUNT value on done: 10299.0 +[2023-09-14 14:57:37,836][63767] Sum rewards: -2.972, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.572', 'AMMO2': '0.008', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'ARMOR': '0.028', 'AMMO4': '0.042', 'weapon7': '0.090', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon5': '0.112', 'AMMO3': '0.152', 'WEAPON5': '0.250', 'HITCOUNT': '0.320', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.850', 'weapon2': '1.212', 'DAMAGECOUNT': '1.320', 'weapon3': '2.128'} +[2023-09-14 14:57:38,401][63805] DAMAGECOUNT value on done: 11134.0 +[2023-09-14 14:57:38,402][63805] Sum rewards: -4.335, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.195', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'weapon5': '0.038', 'HITCOUNT': '0.040', 'ARMOR': '0.088', 'weapon4': '0.098', 'DAMAGECOUNT': '0.123', 'AMMO3': '0.132', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.642', 'weapon2': '1.770'} +[2023-09-14 14:57:38,739][63805] DAMAGECOUNT value on done: 8513.0 +[2023-09-14 14:57:38,739][63805] Sum rewards: 1.364, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.670', 'AMMO2': '0.004', 'AMMO5': '0.010', 'AMMO4': '0.019', 'WEAPON1': '0.020', 'ARMOR': '0.060', 'AMMO3': '0.068', 'weapon5': '0.078', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'HITCOUNT': '0.310', 'weapon4': '0.318', 'WEAPON3': '0.450', 'DAMAGECOUNT': '1.245', 'weapon3': '1.286', 'weapon2': '1.966', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:57:39,355][63732] Updated weights for policy 0, policy_version 1780 (0.0011) +[2023-09-14 14:57:39,442][63770] DAMAGECOUNT value on done: 11393.0 +[2023-09-14 14:57:39,443][63770] Sum rewards: -1.901, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.370', 'AMMO2': '0.007', 'AMMO5': '0.015', 'WEAPON1': '0.030', 'AMMO4': '0.032', 'AMMO3': '0.104', 'HITCOUNT': '0.240', 'WEAPON5': '0.250', 'weapon5': '0.328', 'ARMOR': '0.460', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.849', 'weapon3': '1.560', 'weapon2': '1.694'} +[2023-09-14 14:57:39,565][63769] DAMAGECOUNT value on done: 10216.0 +[2023-09-14 14:57:39,565][63769] Sum rewards: -2.864, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.800', 'AMMO2': '0.006', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO4': '0.029', 'WEAPON4': '0.100', 'AMMO3': '0.109', 'weapon4': '0.110', 'weapon5': '0.112', 'WEAPON5': '0.150', 'HITCOUNT': '0.210', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.582', 'FRAGCOUNT': '1.000', 'weapon3': '1.138', 'weapon2': '2.062'} +[2023-09-14 14:57:39,826][63770] DAMAGECOUNT value on done: 7960.0 +[2023-09-14 14:57:39,827][63770] Sum rewards: -2.257, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.802', 'AMMO5': '0.013', 'AMMO2': '0.013', 'WEAPON1': '0.030', 'AMMO4': '0.062', 'ARMOR': '0.078', 'AMMO3': '0.083', 'HITCOUNT': '0.150', 'weapon5': '0.162', 'weapon4': '0.196', 'WEAPON5': '0.250', 'WEAPON4': '0.300', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.182', 'weapon2': '1.626'} +[2023-09-14 14:57:39,941][63769] DAMAGECOUNT value on done: 9502.0 +[2023-09-14 14:57:39,941][63769] Sum rewards: -4.631, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.452', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'weapon5': '0.014', 'AMMO2': '0.026', 'WEAPON5': '0.050', 'ARMOR': '0.068', 'AMMO4': '0.131', 'AMMO3': '0.147', 'weapon4': '0.234', 'HITCOUNT': '0.260', 'WEAPON4': '0.350', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.780', 'weapon2': '1.586', 'weapon3': '1.662'} +[2023-09-14 14:57:40,355][63734] DAMAGECOUNT value on done: 9802.0 +[2023-09-14 14:57:40,355][63734] Sum rewards: -3.063, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.982', 'AMMO5': '0.010', 'ARMOR': '0.028', 'AMMO2': '0.033', 'AMMO3': '0.129', 'AMMO4': '0.165', 'WEAPON5': '0.250', 'WEAPON4': '0.300', 'weapon4': '0.328', 'HITCOUNT': '0.340', 'weapon5': '0.474', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.750', 'weapon2': '1.384', 'DAMAGECOUNT': '1.401', 'weapon3': '1.576'} +[2023-09-14 14:57:40,512][63735] DAMAGECOUNT value on done: 9347.0 +[2023-09-14 14:57:40,513][63735] Sum rewards: -1.275, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.235', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'AMMO5': '0.013', 'weapon5': '0.026', 'WEAPON1': '0.030', 'AMMO3': '0.078', 'ARMOR': '0.092', 'WEAPON4': '0.100', 'HITCOUNT': '0.160', 'weapon4': '0.166', 'WEAPON5': '0.250', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.765', 'weapon3': '1.508', 'weapon2': '1.736', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:57:40,672][63734] DAMAGECOUNT value on done: 7595.0 +[2023-09-14 14:57:40,673][63734] Sum rewards: -2.166, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.360', 'AMMO2': '0.005', 'AMMO5': '0.013', 'AMMO4': '0.025', 'ARMOR': '0.072', 'AMMO3': '0.140', 'weapon5': '0.154', 'weapon4': '0.226', 'WEAPON4': '0.250', 'HITCOUNT': '0.280', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.810', 'WEAPON3': '0.950', 'weapon2': '1.564', 'weapon3': '1.654', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:57:40,892][63735] DAMAGECOUNT value on done: 11367.0 +[2023-09-14 14:57:40,892][63735] Sum rewards: 0.172, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.130', 'AMMO2': '0.010', 'AMMO5': '0.015', 'AMMO4': '0.052', 'AMMO3': '0.094', 'weapon5': '0.100', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'weapon4': '0.308', 'HITCOUNT': '0.410', 'ARMOR': '0.432', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.203', 'weapon2': '1.606', 'weapon3': '1.772'} +[2023-09-14 14:57:41,941][63806] DAMAGECOUNT value on done: 8186.0 +[2023-09-14 14:57:42,036][63735] DAMAGECOUNT value on done: 9823.0 +[2023-09-14 14:57:42,037][63735] Sum rewards: -1.371, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.758', 'WEAPON1': '0.010', 'AMMO5': '0.017', 'AMMO2': '0.021', 'ARMOR': '0.048', 'AMMO3': '0.099', 'AMMO4': '0.104', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'WEAPON4': '0.300', 'weapon5': '0.378', 'weapon4': '0.454', 'WEAPON3': '0.550', 'weapon2': '1.030', 'DAMAGECOUNT': '1.191', 'weapon3': '1.714', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:57:42,329][63806] DAMAGECOUNT value on done: 10113.0 +[2023-09-14 14:57:42,329][63806] Sum rewards: -0.974, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.290', 'weapon5': '0.002', 'AMMO5': '0.010', 'ARMOR': '0.012', 'AMMO2': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.073', 'AMMO3': '0.104', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'weapon4': '0.208', 'HITCOUNT': '0.310', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.338', 'weapon2': '1.606', 'weapon3': '1.768', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:57:42,449][63735] DAMAGECOUNT value on done: 7966.0 +[2023-09-14 14:57:42,450][63735] Sum rewards: -0.183, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.244', 'AMMO2': '0.011', 'AMMO5': '0.013', 'ARMOR': '0.028', 'WEAPON1': '0.040', 'AMMO4': '0.056', 'weapon5': '0.084', 'WEAPON4': '0.100', 'AMMO3': '0.121', 'HITCOUNT': '0.230', 'WEAPON5': '0.300', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.380', 'weapon2': '1.534', 'weapon3': '1.814', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:57:43,289][63733] Updated weights for policy 1, policy_version 1680 (0.0011) +[2023-09-14 14:57:46,237][63771] DAMAGECOUNT value on done: 8687.0 +[2023-09-14 14:57:46,238][63771] Sum rewards: -3.165, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.444', 'AMMO2': '0.015', 'ARMOR': '0.028', 'WEAPON1': '0.030', 'AMMO5': '0.035', 'WEAPON4': '0.050', 'AMMO4': '0.074', 'AMMO3': '0.130', 'weapon4': '0.150', 'weapon5': '0.248', 'HITCOUNT': '0.450', 'WEAPON5': '0.550', 'WEAPON3': '0.750', 'weapon2': '1.330', 'FRAGCOUNT': '1.500', 'weapon3': '1.818', 'DAMAGECOUNT': '2.121'} +[2023-09-14 14:57:46,320][63767] DAMAGECOUNT value on done: 11513.0 +[2023-09-14 14:57:46,321][63767] Sum rewards: 1.427, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO5': '0.015', 'AMMO2': '0.023', 'WEAPON4': '0.050', 'weapon7': '0.058', 'AMMO3': '0.100', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'weapon4': '0.102', 'AMMO4': '0.115', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'weapon5': '0.300', 'ARMOR': '0.408', 'WEAPON3': '0.550', 'HEALTH': '0.578', 'DAMAGECOUNT': '0.762', 'weapon2': '1.434', 'weapon3': '1.662', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:57:46,585][63732] Updated weights for policy 0, policy_version 1790 (0.0011) +[2023-09-14 14:57:46,603][63771] DAMAGECOUNT value on done: 11057.0 +[2023-09-14 14:57:46,603][63771] Sum rewards: 0.437, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.764', 'AMMO2': '0.008', 'WEAPON1': '0.020', 'AMMO5': '0.030', 'AMMO4': '0.040', 'AMMO3': '0.166', 'weapon5': '0.354', 'ARMOR': '0.400', 'WEAPON5': '0.500', 'HITCOUNT': '0.510', 'WEAPON3': '0.850', 'weapon2': '1.188', 'DAMAGECOUNT': '2.049', 'weapon3': '2.086', 'FRAGCOUNT': '3.500'} +[2023-09-14 14:57:46,687][63767] DAMAGECOUNT value on done: 13472.0 +[2023-09-14 14:57:46,688][63767] Sum rewards: 1.548, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.406', 'AMMO5': '0.015', 'weapon7': '0.024', 'AMMO2': '0.028', 'ARMOR': '0.072', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.114', 'AMMO4': '0.140', 'weapon5': '0.150', 'WEAPON4': '0.250', 'WEAPON5': '0.250', 'weapon4': '0.286', 'HITCOUNT': '0.350', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.254', 'weapon2': '1.572', 'weapon3': '1.648', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:57:48,921][63769] DAMAGECOUNT value on done: 10580.0 +[2023-09-14 14:57:48,922][63769] Sum rewards: -3.035, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.162', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.001', 'AMMO4': '0.005', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'WEAPON4': '0.150', 'AMMO3': '0.151', 'HITCOUNT': '0.160', 'weapon4': '0.214', 'weapon5': '0.300', 'WEAPON5': '0.400', 'ARMOR': '0.516', 'weapon2': '0.592', 'DAMAGECOUNT': '0.807', 'WEAPON3': '0.850', 'weapon3': '2.192'} +[2023-09-14 14:57:49,068][63806] DAMAGECOUNT value on done: 9886.0 +[2023-09-14 14:57:49,068][63806] Sum rewards: -5.953, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.110', 'AMMO5': '0.003', 'AMMO2': '0.020', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'WEAPON5': '0.050', 'AMMO4': '0.098', 'AMMO3': '0.138', 'HITCOUNT': '0.150', 'weapon4': '0.244', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.447', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.494', 'weapon3': '1.812'} +[2023-09-14 14:57:49,313][63769] DAMAGECOUNT value on done: 7650.0 +[2023-09-14 14:57:49,314][63769] Sum rewards: -3.527, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.226', 'AMMO5': '0.005', 'AMMO2': '0.021', 'AMMO3': '0.080', 'ARMOR': '0.092', 'weapon5': '0.094', 'WEAPON5': '0.100', 'AMMO4': '0.105', 'weapon4': '0.128', 'HITCOUNT': '0.150', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.525', 'weapon3': '1.282', 'FRAGCOUNT': '2.000', 'weapon2': '2.016'} +[2023-09-14 14:57:49,393][63806] DAMAGECOUNT value on done: 9360.0 +[2023-09-14 14:57:49,394][63806] Sum rewards: -3.098, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.100', 'AMMO5': '0.007', 'AMMO2': '0.023', 'ARMOR': '0.048', 'weapon5': '0.056', 'AMMO3': '0.091', 'WEAPON4': '0.100', 'AMMO4': '0.116', 'WEAPON5': '0.150', 'HITCOUNT': '0.230', 'weapon4': '0.294', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.780', 'weapon3': '1.568', 'weapon2': '1.688', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:57:50,396][63733] Updated weights for policy 1, policy_version 1690 (0.0011) +[2023-09-14 14:57:50,977][63805] DAMAGECOUNT value on done: 10671.0 +[2023-09-14 14:57:50,978][63805] Sum rewards: -0.488, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.190', 'AMMO4': '-0.036', 'AMMO2': '-0.007', 'AMMO5': '0.007', 'HITCOUNT': '0.060', 'AMMO3': '0.070', 'ARMOR': '0.072', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon5': '0.134', 'weapon7': '0.146', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.402', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.194', 'weapon2': '1.910'} +[2023-09-14 14:57:51,234][63770] DAMAGECOUNT value on done: 8883.0 +[2023-09-14 14:57:51,323][63805] DAMAGECOUNT value on done: 11697.0 +[2023-09-14 14:57:51,324][63805] Sum rewards: -0.251, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.713', 'AMMO2': '0.009', 'AMMO5': '0.020', 'AMMO4': '0.047', 'AMMO3': '0.107', 'weapon7': '0.190', 'HITCOUNT': '0.200', 'AMMO6': '0.220', 'AMMO7': '0.220', 'WEAPON5': '0.250', 'weapon5': '0.286', 'WEAPON7': '0.300', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.224', 'weapon2': '1.552', 'weapon3': '1.736'} +[2023-09-14 14:57:51,628][63770] DAMAGECOUNT value on done: 8934.0 +[2023-09-14 14:57:51,629][63770] Sum rewards: 4.116, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.152', 'AMMO5': '0.010', 'AMMO2': '0.021', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'AMMO4': '0.104', 'AMMO3': '0.166', 'weapon4': '0.212', 'weapon5': '0.222', 'HITCOUNT': '0.430', 'ARMOR': '0.848', 'weapon2': '0.862', 'WEAPON3': '0.950', 'DAMAGECOUNT': '1.665', 'weapon3': '1.878', 'FRAGCOUNT': '6.000'} +[2023-09-14 14:57:52,026][63771] DAMAGECOUNT value on done: 10797.0 +[2023-09-14 14:57:52,342][63771] DAMAGECOUNT value on done: 8057.0 +[2023-09-14 14:57:52,343][63771] Sum rewards: -7.340, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.901', 'AMMO5': '0.005', 'AMMO2': '0.013', 'WEAPON1': '0.050', 'AMMO4': '0.067', 'WEAPON5': '0.100', 'AMMO3': '0.177', 'HITCOUNT': '0.260', 'DAMAGECOUNT': '0.975', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.100', 'weapon2': '1.614', 'weapon3': '1.950'} +[2023-09-14 14:57:53,695][63732] Updated weights for policy 0, policy_version 1800 (0.0011) +[2023-09-14 14:57:57,666][63733] Updated weights for policy 1, policy_version 1700 (0.0010) +[2023-09-14 14:57:59,837][63767] DAMAGECOUNT value on done: 11276.0 +[2023-09-14 14:57:59,837][63767] Sum rewards: -2.091, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.568', 'AMMO2': '0.021', 'AMMO5': '0.023', 'ARMOR': '0.044', 'weapon5': '0.066', 'AMMO4': '0.106', 'AMMO3': '0.178', 'HITCOUNT': '0.380', 'WEAPON4': '0.400', 'WEAPON5': '0.400', 'weapon4': '0.484', 'WEAPON3': '1.150', 'weapon2': '1.158', 'DAMAGECOUNT': '1.305', 'weapon3': '2.012', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:58:00,221][63767] DAMAGECOUNT value on done: 10509.0 +[2023-09-14 14:58:00,222][63767] Sum rewards: -4.359, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.148', 'AMMO2': '0.012', 'AMMO5': '0.015', 'weapon5': '0.028', 'ARMOR': '0.040', 'AMMO4': '0.061', 'weapon4': '0.086', 'WEAPON4': '0.100', 'AMMO3': '0.141', 'HITCOUNT': '0.170', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.630', 'WEAPON3': '0.750', 'weapon3': '1.706', 'weapon2': '1.850', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:58:00,231][63734] DAMAGECOUNT value on done: 10247.0 +[2023-09-14 14:58:00,232][63734] Sum rewards: -4.171, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.658', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.010', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'weapon5': '0.032', 'AMMO4': '0.051', 'ARMOR': '0.060', 'WEAPON4': '0.150', 'AMMO3': '0.156', 'WEAPON5': '0.200', 'HITCOUNT': '0.230', 'weapon4': '0.288', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.810', 'weapon2': '1.090', 'weapon3': '1.624'} +[2023-09-14 14:58:00,560][63734] DAMAGECOUNT value on done: 9933.0 +[2023-09-14 14:58:00,560][63734] Sum rewards: -7.336, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-3.058', 'AMMO5': '0.005', 'AMMO2': '0.021', 'weapon5': '0.032', 'ARMOR': '0.036', 'WEAPON5': '0.100', 'AMMO4': '0.105', 'AMMO3': '0.133', 'HITCOUNT': '0.180', 'weapon4': '0.182', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.549', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.384', 'weapon3': '2.044'} +[2023-09-14 14:58:00,932][63732] Updated weights for policy 0, policy_version 1810 (0.0010) +[2023-09-14 14:58:01,339][63805] DAMAGECOUNT value on done: 11523.0 +[2023-09-14 14:58:01,339][63805] Sum rewards: -2.501, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.646', 'AMMO4': '-0.064', 'AMMO2': '-0.013', 'AMMO5': '0.016', 'WEAPON1': '0.020', 'ARMOR': '0.068', 'weapon5': '0.116', 'AMMO3': '0.140', 'WEAPON5': '0.200', 'HITCOUNT': '0.330', 'WEAPON3': '1.000', 'DAMAGECOUNT': '1.167', 'weapon2': '1.550', 'weapon3': '1.864', 'FRAGCOUNT': '3.500'} +[2023-09-14 14:58:01,724][63805] DAMAGECOUNT value on done: 8887.0 +[2023-09-14 14:58:01,724][63805] Sum rewards: -7.069, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.548', 'AMMO5': '0.007', 'AMMO2': '0.008', 'WEAPON1': '0.010', 'AMMO4': '0.038', 'WEAPON5': '0.050', 'ARMOR': '0.096', 'AMMO3': '0.154', 'HITCOUNT': '0.360', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.122', 'weapon3': '1.718', 'weapon2': '1.816'} +[2023-09-14 14:58:03,088][63769] DAMAGECOUNT value on done: 10281.0 +[2023-09-14 14:58:03,414][63734] DAMAGECOUNT value on done: 9937.0 +[2023-09-14 14:58:03,415][63734] Sum rewards: 0.282, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.050', 'AMMO2': '0.005', 'WEAPON1': '0.020', 'AMMO5': '0.020', 'AMMO4': '0.022', 'ARMOR': '0.074', 'WEAPON4': '0.100', 'HITCOUNT': '0.140', 'AMMO3': '0.142', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.405', 'weapon5': '0.416', 'WEAPON3': '0.750', 'weapon2': '1.284', 'weapon3': '1.754', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:58:03,418][63769] DAMAGECOUNT value on done: 9788.0 +[2023-09-14 14:58:03,419][63769] Sum rewards: 0.799, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.718', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.019', 'AMMO3': '0.125', 'HITCOUNT': '0.140', 'WEAPON5': '0.250', 'weapon5': '0.264', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.858', 'weapon3': '1.374', 'weapon2': '1.710', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:58:03,749][63734] DAMAGECOUNT value on done: 8073.0 +[2023-09-14 14:58:03,749][63734] Sum rewards: -1.559, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.886', 'AMMO5': '0.010', 'AMMO2': '0.014', 'AMMO4': '0.070', 'WEAPON4': '0.100', 'weapon5': '0.102', 'AMMO3': '0.134', 'WEAPON5': '0.200', 'weapon4': '0.254', 'HITCOUNT': '0.330', 'ARMOR': '0.408', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.434', 'FRAGCOUNT': '1.500', 'weapon2': '1.592', 'weapon3': '1.628'} +[2023-09-14 14:58:05,020][63733] Updated weights for policy 1, policy_version 1710 (0.0013) +[2023-09-14 14:58:05,215][63770] DAMAGECOUNT value on done: 11553.0 +[2023-09-14 14:58:05,216][63770] Sum rewards: -7.476, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-2.040', 'WEAPON1': '0.010', 'AMMO2': '0.016', 'AMMO5': '0.025', 'ARMOR': '0.032', 'AMMO4': '0.079', 'AMMO3': '0.168', 'HITCOUNT': '0.170', 'WEAPON4': '0.250', 'weapon5': '0.278', 'weapon4': '0.352', 'DAMAGECOUNT': '0.480', 'WEAPON5': '0.500', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon3': '1.362', 'weapon2': '1.642'} +[2023-09-14 14:58:05,455][63735] DAMAGECOUNT value on done: 9362.0 +[2023-09-14 14:58:05,577][63770] DAMAGECOUNT value on done: 8044.0 +[2023-09-14 14:58:05,578][63770] Sum rewards: 0.439, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.989', 'AMMO2': '0.005', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO4': '0.026', 'ARMOR': '0.068', 'AMMO3': '0.079', 'HITCOUNT': '0.080', 'weapon5': '0.114', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.252', 'WEAPON3': '0.550', 'weapon3': '1.358', 'weapon2': '1.968', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:58:05,815][63735] DAMAGECOUNT value on done: 11472.0 +[2023-09-14 14:58:05,815][63735] Sum rewards: -1.561, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.110', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.020', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.075', 'AMMO4': '0.098', 'weapon5': '0.174', 'AMMO6': '0.200', 'AMMO7': '0.200', 'WEAPON7': '0.200', 'weapon7': '0.250', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.400', 'weapon3': '0.944', 'FRAGCOUNT': '1.000', 'weapon2': '1.258'} +[2023-09-14 14:58:06,826][63806] DAMAGECOUNT value on done: 8495.0 +[2023-09-14 14:58:06,826][63806] Sum rewards: 0.075, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.717', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'AMMO2': '0.022', 'ARMOR': '0.024', 'weapon7': '0.094', 'AMMO4': '0.112', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.124', 'WEAPON7': '0.200', 'weapon5': '0.230', 'HITCOUNT': '0.270', 'WEAPON5': '0.300', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.927', 'weapon2': '1.336', 'weapon3': '2.130', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:58:06,913][63735] DAMAGECOUNT value on done: 10083.0 +[2023-09-14 14:58:06,913][63735] Sum rewards: -1.707, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.496', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'ARMOR': '0.032', 'WEAPON5': '0.050', 'AMMO4': '0.057', 'weapon5': '0.122', 'AMMO3': '0.164', 'HITCOUNT': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.780', 'weapon2': '1.432', 'weapon3': '2.078', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:58:07,213][63806] DAMAGECOUNT value on done: 10233.0 +[2023-09-14 14:58:07,388][63735] DAMAGECOUNT value on done: 8039.0 +[2023-09-14 14:58:08,140][63732] Updated weights for policy 0, policy_version 1820 (0.0011) +[2023-09-14 14:58:08,622][63767] DAMAGECOUNT value on done: 12028.0 +[2023-09-14 14:58:08,623][63767] Sum rewards: 1.619, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.418', 'AMMO2': '0.007', 'AMMO5': '0.007', 'AMMO4': '0.032', 'weapon4': '0.036', 'WEAPON4': '0.100', 'ARMOR': '0.104', 'AMMO3': '0.117', 'WEAPON5': '0.150', 'weapon5': '0.244', 'HITCOUNT': '0.340', 'WEAPON3': '0.800', 'weapon2': '1.160', 'DAMAGECOUNT': '1.545', 'weapon3': '1.894', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:58:08,999][63767] DAMAGECOUNT value on done: 13682.0 +[2023-09-14 14:58:09,000][63767] Sum rewards: -1.119, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.736', 'AMMO2': '0.003', 'AMMO4': '0.016', 'AMMO3': '0.140', 'HITCOUNT': '0.180', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.630', 'weapon2': '1.372', 'weapon3': '1.426', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:58:09,073][63771] DAMAGECOUNT value on done: 8975.0 +[2023-09-14 14:58:09,074][63771] Sum rewards: -2.196, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.858', 'AMMO2': '0.019', 'AMMO5': '0.020', 'WEAPON4': '0.050', 'weapon4': '0.072', 'AMMO4': '0.096', 'AMMO3': '0.140', 'HITCOUNT': '0.230', 'WEAPON5': '0.250', 'ARMOR': '0.416', 'weapon5': '0.426', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.864', 'FRAGCOUNT': '1.000', 'weapon2': '1.546', 'weapon3': '1.732'} +[2023-09-14 14:58:09,419][63771] DAMAGECOUNT value on done: 11487.0 +[2023-09-14 14:58:09,420][63771] Sum rewards: 1.211, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.839', 'AMMO5': '0.012', 'AMMO2': '0.029', 'WEAPON4': '0.050', 'AMMO3': '0.140', 'weapon4': '0.146', 'AMMO4': '0.146', 'WEAPON5': '0.250', 'weapon5': '0.262', 'HITCOUNT': '0.320', 'WEAPON3': '0.750', 'ARMOR': '0.800', 'DAMAGECOUNT': '1.290', 'weapon2': '1.440', 'weapon3': '1.664', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:58:11,970][63806] DAMAGECOUNT value on done: 10156.0 +[2023-09-14 14:58:11,971][63806] Sum rewards: -0.506, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.204', 'AMMO5': '0.010', 'AMMO2': '0.010', 'ARMOR': '0.040', 'WEAPON1': '0.040', 'AMMO4': '0.050', 'AMMO3': '0.090', 'weapon5': '0.128', 'WEAPON5': '0.200', 'HITCOUNT': '0.220', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.810', 'weapon3': '1.256', 'weapon2': '1.844', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:58:12,262][63733] Updated weights for policy 1, policy_version 1720 (0.0011) +[2023-09-14 14:58:12,358][63806] DAMAGECOUNT value on done: 9820.0 +[2023-09-14 14:58:12,358][63806] Sum rewards: -1.146, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.662', 'AMMO5': '0.005', 'AMMO2': '0.012', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.059', 'weapon5': '0.066', 'weapon4': '0.130', 'AMMO3': '0.152', 'HITCOUNT': '0.320', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.380', 'weapon2': '1.474', 'weapon3': '1.768', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:58:12,500][63454] Saving new best policy, reward=-1.556! +[2023-09-14 14:58:13,977][63805] DAMAGECOUNT value on done: 10917.0 +[2023-09-14 14:58:13,977][63805] Sum rewards: -0.731, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.752', 'AMMO2': '0.009', 'AMMO5': '0.009', 'AMMO4': '0.042', 'ARMOR': '0.064', 'WEAPON5': '0.150', 'AMMO3': '0.161', 'weapon5': '0.182', 'HITCOUNT': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'DAMAGECOUNT': '0.738', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.346', 'weapon3': '2.270'} +[2023-09-14 14:58:14,361][63805] DAMAGECOUNT value on done: 12235.0 +[2023-09-14 14:58:14,362][63805] Sum rewards: 1.472, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.100', 'AMMO4': '-0.019', 'AMMO2': '-0.004', 'WEAPON1': '0.010', 'AMMO5': '0.017', 'weapon5': '0.114', 'AMMO3': '0.131', 'WEAPON5': '0.300', 'HITCOUNT': '0.380', 'WEAPON3': '0.800', 'weapon2': '1.132', 'DAMAGECOUNT': '1.614', 'weapon3': '2.346', 'FRAGCOUNT': '2.500'} +[2023-09-14 14:58:14,415][63769] DAMAGECOUNT value on done: 10764.0 +[2023-09-14 14:58:14,416][63769] Sum rewards: -1.969, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.479', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'AMMO5': '0.008', 'weapon5': '0.062', 'weapon4': '0.098', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'ARMOR': '0.116', 'AMMO3': '0.133', 'HITCOUNT': '0.190', 'DAMAGECOUNT': '0.552', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.530', 'weapon3': '1.582'} +[2023-09-14 14:58:14,840][63769] DAMAGECOUNT value on done: 7837.0 +[2023-09-14 14:58:14,840][63769] Sum rewards: -3.457, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.290', 'AMMO2': '0.003', 'AMMO5': '0.005', 'AMMO4': '0.016', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'WEAPON4': '0.100', 'AMMO3': '0.107', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'weapon4': '0.178', 'weapon5': '0.208', 'DAMAGECOUNT': '0.561', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.390', 'weapon3': '1.488'} +[2023-09-14 14:58:14,844][63771] DAMAGECOUNT value on done: 11002.0 +[2023-09-14 14:58:14,845][63771] Sum rewards: -1.860, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.752', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'weapon4': '0.030', 'AMMO2': '0.032', 'WEAPON5': '0.050', 'ARMOR': '0.067', 'weapon5': '0.104', 'HITCOUNT': '0.160', 'AMMO4': '0.161', 'AMMO3': '0.164', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.615', 'WEAPON3': '1.000', 'weapon2': '1.484', 'weapon3': '1.762', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:58:15,224][63771] DAMAGECOUNT value on done: 8247.0 +[2023-09-14 14:58:15,225][63771] Sum rewards: -1.602, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.498', 'AMMO2': '0.017', 'AMMO5': '0.018', 'ARMOR': '0.036', 'weapon4': '0.044', 'WEAPON4': '0.050', 'weapon5': '0.086', 'AMMO4': '0.086', 'AMMO3': '0.115', 'HITCOUNT': '0.180', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.570', 'WEAPON3': '0.700', 'weapon3': '1.382', 'weapon2': '1.662', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:58:15,338][63732] Updated weights for policy 0, policy_version 1830 (0.0011) +[2023-09-14 14:58:16,854][63770] DAMAGECOUNT value on done: 9076.0 +[2023-09-14 14:58:16,854][63770] Sum rewards: -0.069, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.256', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'AMMO2': '0.022', 'weapon5': '0.068', 'AMMO3': '0.085', 'ARMOR': '0.108', 'AMMO4': '0.108', 'HITCOUNT': '0.130', 'WEAPON4': '0.200', 'weapon4': '0.250', 'WEAPON5': '0.300', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.579', 'FRAGCOUNT': '1.000', 'weapon2': '1.248', 'weapon3': '1.614'} +[2023-09-14 14:58:17,204][63770] DAMAGECOUNT value on done: 9424.0 +[2023-09-14 14:58:17,205][63770] Sum rewards: 0.767, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.282', 'AMMO2': '0.007', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.035', 'ARMOR': '0.060', 'AMMO3': '0.165', 'WEAPON5': '0.200', 'weapon5': '0.204', 'HITCOUNT': '0.420', 'WEAPON3': '0.850', 'weapon2': '1.140', 'DAMAGECOUNT': '1.470', 'weapon3': '2.476', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:58:17,469][63454] Saving new best policy, reward=-1.414! +[2023-09-14 14:58:19,508][63733] Updated weights for policy 1, policy_version 1730 (0.0012) +[2023-09-14 14:58:22,577][63767] DAMAGECOUNT value on done: 11643.0 +[2023-09-14 14:58:22,578][63767] Sum rewards: -7.198, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-0.886', 'AMMO2': '0.005', 'AMMO5': '0.007', 'AMMO4': '0.022', 'ARMOR': '0.064', 'WEAPON5': '0.150', 'weapon5': '0.184', 'AMMO3': '0.223', 'HITCOUNT': '0.310', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.101', 'weapon2': '1.288', 'WEAPON3': '1.300', 'weapon3': '2.284'} +[2023-09-14 14:58:22,662][63732] Updated weights for policy 0, policy_version 1840 (0.0011) +[2023-09-14 14:58:22,957][63767] DAMAGECOUNT value on done: 11412.0 +[2023-09-14 14:58:22,957][63767] Sum rewards: 6.838, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.557', 'AMMO4': '-0.006', 'AMMO2': '-0.001', 'AMMO5': '0.010', 'weapon6': '0.056', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON6': '0.100', 'ARMOR': '0.116', 'AMMO3': '0.135', 'WEAPON5': '0.150', 'weapon5': '0.152', 'HITCOUNT': '0.640', 'WEAPON3': '0.800', 'weapon2': '1.314', 'weapon3': '2.270', 'DAMAGECOUNT': '2.709', 'FRAGCOUNT': '7.000'} +[2023-09-14 14:58:23,112][63734] DAMAGECOUNT value on done: 10437.0 +[2023-09-14 14:58:23,428][63734] DAMAGECOUNT value on done: 10208.0 +[2023-09-14 14:58:23,428][63734] Sum rewards: -0.453, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.720', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.015', 'AMMO4': '0.074', 'WEAPON5': '0.100', 'ARMOR': '0.122', 'AMMO3': '0.124', 'WEAPON4': '0.150', 'HITCOUNT': '0.210', 'weapon4': '0.214', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.825', 'FRAGCOUNT': '1.000', 'weapon3': '1.330', 'weapon2': '1.488'} +[2023-09-14 14:58:24,066][63805] DAMAGECOUNT value on done: 11688.0 +[2023-09-14 14:58:24,425][63805] DAMAGECOUNT value on done: 9073.0 +[2023-09-14 14:58:24,426][63805] Sum rewards: -3.105, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.529', 'AMMO5': '0.010', 'weapon5': '0.012', 'AMMO2': '0.015', 'WEAPON1': '0.040', 'AMMO4': '0.072', 'AMMO3': '0.122', 'weapon4': '0.130', 'WEAPON5': '0.200', 'HITCOUNT': '0.210', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.558', 'ARMOR': '0.569', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.206', 'weapon2': '1.680'} +[2023-09-14 14:58:26,293][63769] DAMAGECOUNT value on done: 10566.0 +[2023-09-14 14:58:26,294][63769] Sum rewards: -1.993, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.182', 'AMMO4': '-0.028', 'AMMO2': '-0.006', 'AMMO5': '0.007', 'weapon5': '0.012', 'WEAPON1': '0.040', 'AMMO3': '0.101', 'WEAPON5': '0.150', 'HITCOUNT': '0.190', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.855', 'weapon3': '1.560', 'weapon2': '1.656', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:58:26,548][63734] DAMAGECOUNT value on done: 10097.0 +[2023-09-14 14:58:26,548][63734] Sum rewards: -4.062, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.720', 'AMMO4': '-0.015', 'AMMO2': '-0.003', 'AMMO5': '0.005', 'ARMOR': '0.032', 'HITCOUNT': '0.070', 'weapon7': '0.070', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.141', 'WEAPON5': '0.150', 'weapon5': '0.242', 'DAMAGECOUNT': '0.480', 'WEAPON3': '0.500', 'weapon3': '0.692', 'FRAGCOUNT': '1.000', 'weapon2': '2.244'} +[2023-09-14 14:58:26,644][63769] DAMAGECOUNT value on done: 9923.0 +[2023-09-14 14:58:26,644][63769] Sum rewards: -5.301, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.179', 'AMMO5': '0.005', 'AMMO2': '0.010', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'weapon5': '0.032', 'AMMO4': '0.051', 'HITCOUNT': '0.080', 'WEAPON5': '0.100', 'AMMO3': '0.146', 'DAMAGECOUNT': '0.405', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.650', 'weapon2': '1.652', 'weapon3': '1.702'} +[2023-09-14 14:58:26,720][63733] Updated weights for policy 1, policy_version 1740 (0.0011) +[2023-09-14 14:58:26,880][63734] DAMAGECOUNT value on done: 8241.0 +[2023-09-14 14:58:26,881][63734] Sum rewards: -1.159, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.336', 'AMMO2': '0.009', 'AMMO5': '0.010', 'AMMO4': '0.045', 'HITCOUNT': '0.120', 'AMMO3': '0.129', 'weapon5': '0.130', 'WEAPON5': '0.200', 'ARMOR': '0.472', 'DAMAGECOUNT': '0.504', 'WEAPON3': '0.900', 'weapon2': '1.400', 'weapon3': '2.258', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:58:27,465][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001741_7131136.pth... +[2023-09-14 14:58:27,466][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001846_7561216.pth... +[2023-09-14 14:58:27,520][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001428_5849088.pth +[2023-09-14 14:58:27,526][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001493_6115328.pth +[2023-09-14 14:58:27,533][63454] Saving new best policy, reward=-1.389! +[2023-09-14 14:58:29,915][63732] Updated weights for policy 0, policy_version 1850 (0.0011) +[2023-09-14 14:58:30,575][63735] DAMAGECOUNT value on done: 9587.0 +[2023-09-14 14:58:30,575][63735] Sum rewards: -3.874, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.150', 'AMMO4': '-0.021', 'AMMO2': '-0.004', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'ARMOR': '0.028', 'weapon5': '0.046', 'WEAPON5': '0.150', 'AMMO3': '0.171', 'HITCOUNT': '0.180', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.584', 'weapon2': '1.634'} +[2023-09-14 14:58:30,860][63770] DAMAGECOUNT value on done: 11700.0 +[2023-09-14 14:58:30,861][63770] Sum rewards: -1.212, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.951', 'AMMO5': '0.005', 'AMMO2': '0.014', 'weapon5': '0.036', 'AMMO4': '0.070', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.110', 'HITCOUNT': '0.130', 'weapon4': '0.182', 'DAMAGECOUNT': '0.441', 'ARMOR': '0.448', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.278', 'weapon3': '1.824'} +[2023-09-14 14:58:31,040][63735] DAMAGECOUNT value on done: 11739.0 +[2023-09-14 14:58:31,041][63735] Sum rewards: -0.915, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.106', 'AMMO5': '0.007', 'AMMO2': '0.020', 'WEAPON4': '0.050', 'ARMOR': '0.058', 'AMMO4': '0.098', 'WEAPON5': '0.100', 'weapon5': '0.132', 'AMMO3': '0.146', 'weapon4': '0.208', 'HITCOUNT': '0.230', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.801', 'weapon3': '1.152', 'weapon2': '2.038', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:58:31,294][63770] DAMAGECOUNT value on done: 8599.0 +[2023-09-14 14:58:31,294][63770] Sum rewards: -1.111, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.328', 'AMMO4': '-0.021', 'AMMO2': '-0.004', 'AMMO5': '0.023', 'WEAPON1': '0.030', 'weapon5': '0.030', 'ARMOR': '0.064', 'AMMO3': '0.169', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.350', 'HITCOUNT': '0.420', 'WEAPON3': '0.900', 'weapon2': '1.270', 'DAMAGECOUNT': '1.665', 'weapon3': '1.972', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:58:31,538][63806] DAMAGECOUNT value on done: 8880.0 +[2023-09-14 14:58:31,538][63806] Sum rewards: 4.913, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.600', 'AMMO5': '0.010', 'AMMO2': '0.012', 'ARMOR': '0.024', 'weapon5': '0.052', 'AMMO4': '0.059', 'AMMO3': '0.173', 'WEAPON5': '0.200', 'HITCOUNT': '0.280', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.155', 'weapon2': '1.570', 'weapon3': '2.128', 'FRAGCOUNT': '8.000'} +[2023-09-14 14:58:31,671][63767] DAMAGECOUNT value on done: 12253.0 +[2023-09-14 14:58:31,671][63767] Sum rewards: -3.785, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.632', 'AMMO2': '0.015', 'weapon4': '0.058', 'AMMO4': '0.074', 'AMMO3': '0.139', 'WEAPON4': '0.150', 'HITCOUNT': '0.210', 'ARMOR': '0.464', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.860', 'weapon3': '1.902'} +[2023-09-14 14:58:31,939][63806] DAMAGECOUNT value on done: 10350.0 +[2023-09-14 14:58:32,054][63767] DAMAGECOUNT value on done: 14298.0 +[2023-09-14 14:58:32,054][63767] Sum rewards: 2.401, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.044', 'AMMO2': '0.005', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'AMMO4': '0.027', 'ARMOR': '0.038', 'weapon5': '0.066', 'AMMO3': '0.157', 'WEAPON5': '0.200', 'HITCOUNT': '0.530', 'WEAPON3': '0.950', 'weapon2': '1.388', 'DAMAGECOUNT': '1.848', 'weapon3': '2.210', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:58:32,154][63771] DAMAGECOUNT value on done: 9390.0 +[2023-09-14 14:58:32,155][63771] Sum rewards: 0.697, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.198', 'weapon5': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.014', 'weapon7': '0.024', 'ARMOR': '0.028', 'WEAPON4': '0.050', 'AMMO4': '0.068', 'weapon4': '0.084', 'AMMO3': '0.116', 'WEAPON5': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.340', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.245', 'weapon2': '1.704', 'weapon3': '1.904', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:58:32,230][63735] DAMAGECOUNT value on done: 10468.0 +[2023-09-14 14:58:32,230][63735] Sum rewards: 0.447, reward structure: {'DEATHCOUNT': '-8.250', 'weapon4': '0.004', 'AMMO2': '0.011', 'ARMOR': '0.012', 'AMMO5': '0.022', 'AMMO4': '0.056', 'WEAPON4': '0.100', 'AMMO3': '0.123', 'HEALTH': '0.175', 'weapon5': '0.204', 'WEAPON5': '0.350', 'HITCOUNT': '0.360', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.155', 'weapon2': '1.516', 'weapon3': '1.908', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:58:32,461][63454] Saving new best policy, reward=-1.286! +[2023-09-14 14:58:32,504][63771] DAMAGECOUNT value on done: 11822.0 +[2023-09-14 14:58:32,504][63771] Sum rewards: -3.497, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.677', 'AMMO2': '0.008', 'AMMO5': '0.010', 'ARMOR': '0.016', 'AMMO4': '0.039', 'weapon5': '0.070', 'WEAPON5': '0.150', 'AMMO3': '0.168', 'HITCOUNT': '0.380', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.005', 'weapon2': '1.738', 'weapon3': '2.046'} +[2023-09-14 14:58:32,656][63735] DAMAGECOUNT value on done: 8378.0 +[2023-09-14 14:58:32,657][63735] Sum rewards: -3.030, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.561', 'AMMO5': '0.005', 'ARMOR': '0.012', 'AMMO2': '0.015', 'AMMO4': '0.072', 'weapon4': '0.076', 'WEAPON5': '0.100', 'AMMO3': '0.150', 'WEAPON4': '0.200', 'HITCOUNT': '0.270', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.017', 'weapon3': '1.472', 'weapon2': '1.892', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:58:34,025][63733] Updated weights for policy 1, policy_version 1750 (0.0011) +[2023-09-14 14:58:34,505][63806] DAMAGECOUNT value on done: 10248.0 +[2023-09-14 14:58:34,918][63806] DAMAGECOUNT value on done: 9925.0 +[2023-09-14 14:58:36,928][63805] DAMAGECOUNT value on done: 11339.0 +[2023-09-14 14:58:36,929][63805] Sum rewards: 4.699, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.962', 'AMMO4': '-0.033', 'AMMO2': '-0.007', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'WEAPON4': '0.050', 'AMMO3': '0.069', 'weapon4': '0.178', 'WEAPON5': '0.300', 'HITCOUNT': '0.420', 'weapon5': '0.462', 'ARMOR': '0.487', 'WEAPON3': '0.500', 'weapon3': '1.244', 'DAMAGECOUNT': '1.266', 'weapon2': '1.700', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:58:37,166][63732] Updated weights for policy 0, policy_version 1860 (0.0011) +[2023-09-14 14:58:37,343][63805] DAMAGECOUNT value on done: 12835.0 +[2023-09-14 14:58:37,343][63805] Sum rewards: 2.588, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.510', 'AMMO2': '0.005', 'AMMO5': '0.017', 'AMMO4': '0.024', 'WEAPON1': '0.030', 'ARMOR': '0.040', 'AMMO3': '0.133', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon5': '0.266', 'WEAPON5': '0.350', 'HITCOUNT': '0.440', 'WEAPON3': '0.750', 'weapon3': '1.624', 'weapon2': '1.768', 'DAMAGECOUNT': '1.800', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:58:37,466][63454] Saving new best policy, reward=-1.213! +[2023-09-14 14:58:37,864][63771] DAMAGECOUNT value on done: 11192.0 +[2023-09-14 14:58:37,865][63771] Sum rewards: 0.664, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.615', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'AMMO5': '0.003', 'WEAPON1': '0.020', 'AMMO3': '0.090', 'ARMOR': '0.092', 'weapon5': '0.094', 'WEAPON5': '0.100', 'HITCOUNT': '0.120', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.570', 'weapon2': '1.076', 'weapon3': '1.196', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:58:38,216][63771] DAMAGECOUNT value on done: 8257.0 +[2023-09-14 14:58:39,937][63769] DAMAGECOUNT value on done: 10909.0 +[2023-09-14 14:58:39,938][63769] Sum rewards: -2.006, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.384', 'AMMO2': '0.011', 'AMMO5': '0.020', 'WEAPON4': '0.050', 'AMMO4': '0.057', 'ARMOR': '0.069', 'AMMO3': '0.130', 'weapon5': '0.168', 'HITCOUNT': '0.180', 'weapon4': '0.220', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.800', 'weapon2': '0.884', 'FRAGCOUNT': '1.000', 'weapon3': '2.354'} +[2023-09-14 14:58:40,320][63769] DAMAGECOUNT value on done: 7926.0 +[2023-09-14 14:58:40,905][63806] Large shaping reward -2.534 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.28500000000000003, -95.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 14:58:41,428][63733] Updated weights for policy 1, policy_version 1760 (0.0012) +[2023-09-14 14:58:42,626][63770] DAMAGECOUNT value on done: 9247.0 +[2023-09-14 14:58:42,626][63770] Sum rewards: 0.185, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.372', 'AMMO2': '0.000', 'AMMO4': '0.002', 'AMMO5': '0.012', 'weapon5': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.034', 'AMMO3': '0.088', 'HITCOUNT': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON5': '0.150', 'weapon7': '0.152', 'WEAPON7': '0.200', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.513', 'weapon3': '1.070', 'weapon2': '1.712', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:58:43,008][63770] DAMAGECOUNT value on done: 9780.0 +[2023-09-14 14:58:43,009][63770] Sum rewards: 3.938, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.556', 'AMMO2': '0.003', 'AMMO5': '0.005', 'weapon5': '0.006', 'AMMO4': '0.014', 'WEAPON1': '0.020', 'WEAPON5': '0.100', 'AMMO3': '0.144', 'HITCOUNT': '0.270', 'ARMOR': '0.440', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.068', 'weapon2': '1.488', 'weapon3': '1.986', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:58:44,571][63732] Updated weights for policy 0, policy_version 1870 (0.0011) +[2023-09-14 14:58:45,503][63767] DAMAGECOUNT value on done: 12000.0 +[2023-09-14 14:58:45,504][63767] Sum rewards: -1.403, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.090', 'ARMOR': '0.008', 'WEAPON1': '0.020', 'AMMO5': '0.022', 'AMMO2': '0.036', 'AMMO3': '0.118', 'HITCOUNT': '0.160', 'AMMO4': '0.182', 'weapon5': '0.266', 'weapon4': '0.288', 'WEAPON4': '0.300', 'WEAPON5': '0.500', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.071', 'weapon2': '1.468', 'weapon3': '1.648', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:58:45,819][63767] DAMAGECOUNT value on done: 11683.0 +[2023-09-14 14:58:45,820][63767] Sum rewards: -2.329, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.316', 'AMMO4': '-0.017', 'AMMO2': '-0.003', 'AMMO5': '0.031', 'ARMOR': '0.032', 'AMMO3': '0.143', 'HITCOUNT': '0.210', 'weapon5': '0.270', 'WEAPON5': '0.450', 'DAMAGECOUNT': '0.813', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.562', 'weapon3': '1.896'} +[2023-09-14 14:58:46,570][63734] DAMAGECOUNT value on done: 10592.0 +[2023-09-14 14:58:46,571][63734] Sum rewards: -4.890, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.944', 'AMMO4': '-0.018', 'AMMO2': '-0.004', 'ARMOR': '0.004', 'WEAPON1': '0.030', 'AMMO3': '0.098', 'WEAPON4': '0.100', 'HITCOUNT': '0.120', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.650', 'weapon3': '1.518', 'weapon2': '1.840', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:58:46,903][63734] DAMAGECOUNT value on done: 10427.0 +[2023-09-14 14:58:46,903][63734] Sum rewards: -0.483, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.050', 'AMMO5': '0.003', 'AMMO2': '0.003', 'weapon5': '0.008', 'WEAPON1': '0.010', 'AMMO4': '0.015', 'WEAPON5': '0.050', 'ARMOR': '0.084', 'AMMO3': '0.125', 'HITCOUNT': '0.150', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.657', 'weapon2': '1.492', 'weapon3': '1.820', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:58:47,252][63805] DAMAGECOUNT value on done: 11703.0 +[2023-09-14 14:58:47,252][63805] Sum rewards: -6.495, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-3.260', 'AMMO2': '0.003', 'AMMO4': '0.013', 'HITCOUNT': '0.020', 'DAMAGECOUNT': '0.045', 'WEAPON4': '0.100', 'ARMOR': '0.124', 'AMMO3': '0.200', 'weapon4': '0.230', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.444', 'weapon3': '1.636'} +[2023-09-14 14:58:47,467][63454] Saving new best policy, reward=-1.209! +[2023-09-14 14:58:47,598][63805] DAMAGECOUNT value on done: 9243.0 +[2023-09-14 14:58:47,599][63805] Sum rewards: -2.834, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.010', 'AMMO2': '0.004', 'weapon5': '0.006', 'ARMOR': '0.008', 'WEAPON1': '0.010', 'AMMO5': '0.010', 'AMMO4': '0.018', 'weapon4': '0.018', 'AMMO3': '0.088', 'WEAPON4': '0.100', 'HITCOUNT': '0.150', 'WEAPON5': '0.200', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.510', 'FRAGCOUNT': '1.000', 'weapon3': '1.214', 'weapon2': '1.840'} +[2023-09-14 14:58:48,717][63733] Updated weights for policy 1, policy_version 1770 (0.0011) +[2023-09-14 14:58:49,773][63769] DAMAGECOUNT value on done: 10850.0 +[2023-09-14 14:58:49,774][63769] Sum rewards: -5.423, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.966', 'AMMO4': '-0.012', 'AMMO2': '-0.002', 'ARMOR': '0.104', 'AMMO3': '0.127', 'HITCOUNT': '0.250', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.852', 'weapon2': '1.534', 'weapon3': '1.890', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:58:50,114][63769] DAMAGECOUNT value on done: 10003.0 +[2023-09-14 14:58:50,133][63734] DAMAGECOUNT value on done: 10419.0 +[2023-09-14 14:58:50,133][63734] Sum rewards: -3.554, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.856', 'AMMO2': '0.009', 'AMMO5': '0.022', 'ARMOR': '0.024', 'WEAPON1': '0.030', 'AMMO4': '0.045', 'weapon5': '0.146', 'AMMO3': '0.184', 'HITCOUNT': '0.270', 'WEAPON5': '0.350', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.966', 'weapon2': '1.096', 'FRAGCOUNT': '2.000', 'weapon3': '2.510'} +[2023-09-14 14:58:50,537][63734] DAMAGECOUNT value on done: 8696.0 +[2023-09-14 14:58:50,538][63734] Sum rewards: 0.263, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.722', 'AMMO5': '0.015', 'AMMO2': '0.022', 'ARMOR': '0.032', 'WEAPON1': '0.040', 'AMMO4': '0.107', 'AMMO3': '0.136', 'weapon5': '0.306', 'HITCOUNT': '0.320', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'weapon2': '1.280', 'DAMAGECOUNT': '1.365', 'weapon3': '1.912', 'FRAGCOUNT': '3.500'} +[2023-09-14 14:58:51,846][63732] Updated weights for policy 0, policy_version 1880 (0.0011) +[2023-09-14 14:58:52,462][63454] Saving new best policy, reward=-1.188! +[2023-09-14 14:58:54,428][63767] DAMAGECOUNT value on done: 12722.0 +[2023-09-14 14:58:54,429][63767] Sum rewards: -2.973, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.286', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.023', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'AMMO4': '0.116', 'weapon4': '0.150', 'AMMO3': '0.154', 'WEAPON5': '0.200', 'HITCOUNT': '0.310', 'weapon5': '0.398', 'WEAPON3': '0.850', 'weapon2': '1.040', 'DAMAGECOUNT': '1.407', 'FRAGCOUNT': '2.000', 'weapon3': '2.062'} +[2023-09-14 14:58:54,813][63767] DAMAGECOUNT value on done: 14453.0 +[2023-09-14 14:58:54,814][63767] Sum rewards: -1.866, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.346', 'AMMO2': '0.002', 'AMMO4': '0.010', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'ARMOR': '0.129', 'AMMO3': '0.131', 'weapon4': '0.166', 'WEAPON5': '0.200', 'weapon5': '0.312', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.800', 'weapon2': '1.106', 'FRAGCOUNT': '1.500', 'weapon3': '1.928'} +[2023-09-14 14:58:55,482][63771] DAMAGECOUNT value on done: 9530.0 +[2023-09-14 14:58:55,482][63771] Sum rewards: -0.622, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.892', 'AMMO4': '-0.041', 'AMMO2': '-0.008', 'AMMO5': '0.015', 'ARMOR': '0.044', 'HITCOUNT': '0.090', 'AMMO3': '0.112', 'weapon7': '0.142', 'weapon5': '0.168', 'WEAPON5': '0.200', 'AMMO6': '0.220', 'AMMO7': '0.220', 'WEAPON7': '0.300', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.376', 'weapon3': '1.412'} +[2023-09-14 14:58:55,846][63771] DAMAGECOUNT value on done: 11971.0 +[2023-09-14 14:58:55,847][63771] Sum rewards: -6.492, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-3.000', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'AMMO5': '0.007', 'WEAPON1': '0.030', 'weapon5': '0.088', 'WEAPON4': '0.100', 'weapon4': '0.120', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'AMMO3': '0.215', 'DAMAGECOUNT': '0.447', 'ARMOR': '0.457', 'WEAPON3': '1.000', 'weapon2': '1.508', 'weapon3': '1.996', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:58:55,857][63735] DAMAGECOUNT value on done: 9866.0 +[2023-09-14 14:58:55,899][63733] Updated weights for policy 1, policy_version 1780 (0.0010) +[2023-09-14 14:58:56,262][63735] DAMAGECOUNT value on done: 12303.0 +[2023-09-14 14:58:56,263][63735] Sum rewards: -1.032, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.669', 'AMMO5': '0.007', 'AMMO2': '0.018', 'ARMOR': '0.048', 'WEAPON4': '0.050', 'AMMO4': '0.091', 'weapon4': '0.112', 'weapon5': '0.114', 'AMMO3': '0.138', 'WEAPON5': '0.150', 'HITCOUNT': '0.330', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.692', 'weapon2': '1.748', 'weapon3': '1.788', 'FRAGCOUNT': '2.500'} +[2023-09-14 14:58:56,373][63806] DAMAGECOUNT value on done: 9487.0 +[2023-09-14 14:58:56,373][63806] Sum rewards: 1.829, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.520', 'AMMO2': '0.008', 'AMMO5': '0.018', 'WEAPON1': '0.030', 'AMMO4': '0.041', 'ARMOR': '0.062', 'weapon4': '0.072', 'AMMO3': '0.109', 'WEAPON4': '0.200', 'weapon5': '0.248', 'WEAPON5': '0.350', 'HITCOUNT': '0.360', 'WEAPON3': '0.850', 'weapon2': '1.274', 'DAMAGECOUNT': '1.821', 'weapon3': '1.906', 'FRAGCOUNT': '3.500'} +[2023-09-14 14:58:56,482][63770] DAMAGECOUNT value on done: 12050.0 +[2023-09-14 14:58:56,482][63770] Sum rewards: -0.791, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.860', 'AMMO2': '0.005', 'AMMO5': '0.019', 'WEAPON1': '0.020', 'AMMO4': '0.027', 'ARMOR': '0.056', 'AMMO3': '0.120', 'weapon4': '0.190', 'WEAPON4': '0.200', 'weapon5': '0.266', 'WEAPON5': '0.300', 'HITCOUNT': '0.300', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.050', 'weapon2': '1.280', 'weapon3': '1.586'} +[2023-09-14 14:58:56,709][63806] DAMAGECOUNT value on done: 10425.0 +[2023-09-14 14:58:56,929][63770] DAMAGECOUNT value on done: 8879.0 +[2023-09-14 14:58:56,930][63770] Sum rewards: -3.220, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.711', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'AMMO4': '0.055', 'ARMOR': '0.064', 'AMMO3': '0.152', 'weapon4': '0.160', 'WEAPON4': '0.200', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.840', 'WEAPON3': '0.900', 'weapon2': '1.182', 'weapon3': '1.706', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:58:57,406][63735] DAMAGECOUNT value on done: 11011.0 +[2023-09-14 14:58:57,406][63735] Sum rewards: -0.056, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.143', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'AMMO5': '0.015', 'ARMOR': '0.028', 'WEAPON4': '0.100', 'weapon5': '0.110', 'AMMO3': '0.126', 'weapon4': '0.200', 'WEAPON5': '0.250', 'HITCOUNT': '0.320', 'weapon2': '0.832', 'WEAPON3': '1.050', 'DAMAGECOUNT': '1.629', 'weapon3': '2.440', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:58:57,430][63806] DAMAGECOUNT value on done: 10318.0 +[2023-09-14 14:58:57,763][63806] DAMAGECOUNT value on done: 10165.0 +[2023-09-14 14:58:57,763][63806] Sum rewards: -4.453, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.546', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.032', 'AMMO2': '-0.006', 'weapon5': '0.006', 'WEAPON1': '0.010', 'AMMO5': '0.014', 'ARMOR': '0.040', 'AMMO3': '0.112', 'HITCOUNT': '0.180', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.720', 'WEAPON3': '0.750', 'weapon3': '1.430', 'weapon2': '1.668'} +[2023-09-14 14:58:57,791][63735] DAMAGECOUNT value on done: 8508.0 +[2023-09-14 14:58:57,792][63735] Sum rewards: -3.598, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.036', 'AMMO5': '0.003', 'AMMO2': '0.012', 'weapon5': '0.012', 'WEAPON1': '0.020', 'WEAPON5': '0.050', 'AMMO4': '0.058', 'AMMO3': '0.074', 'ARMOR': '0.108', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'weapon4': '0.174', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.450', 'FRAGCOUNT': '1.000', 'weapon3': '1.300', 'weapon2': '1.738'} +[2023-09-14 14:58:59,031][63732] Updated weights for policy 0, policy_version 1890 (0.0011) +[2023-09-14 14:59:00,008][63805] DAMAGECOUNT value on done: 11815.0 +[2023-09-14 14:59:00,008][63805] Sum rewards: 2.489, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.042', 'AMMO2': '0.005', 'weapon7': '0.012', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.025', 'ARMOR': '0.076', 'AMMO3': '0.082', 'weapon4': '0.082', 'WEAPON4': '0.100', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon5': '0.212', 'HITCOUNT': '0.240', 'WEAPON5': '0.250', 'WEAPON3': '0.600', 'weapon3': '1.416', 'DAMAGECOUNT': '1.428', 'weapon2': '1.620', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:59:00,341][63805] DAMAGECOUNT value on done: 13087.0 +[2023-09-14 14:59:00,341][63805] Sum rewards: 0.080, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.336', 'AMMO2': '0.007', 'AMMO5': '0.023', 'AMMO4': '0.036', 'WEAPON4': '0.050', 'ARMOR': '0.096', 'AMMO3': '0.168', 'weapon4': '0.194', 'HITCOUNT': '0.200', 'weapon5': '0.270', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.756', 'WEAPON3': '0.850', 'weapon2': '1.008', 'weapon3': '2.158', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:59:01,095][63771] DAMAGECOUNT value on done: 11342.0 +[2023-09-14 14:59:01,096][63771] Sum rewards: -2.602, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.776', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.002', 'AMMO5': '0.007', 'AMMO4': '0.011', 'WEAPON1': '0.030', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'weapon5': '0.054', 'weapon4': '0.082', 'AMMO3': '0.111', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.500', 'weapon3': '1.506', 'weapon2': '1.530'} +[2023-09-14 14:59:01,441][63771] DAMAGECOUNT value on done: 8417.0 +[2023-09-14 14:59:02,461][63454] Saving new best policy, reward=-1.176! +[2023-09-14 14:59:03,124][63733] Updated weights for policy 1, policy_version 1790 (0.0011) +[2023-09-14 14:59:05,229][63769] DAMAGECOUNT value on done: 11064.0 +[2023-09-14 14:59:05,230][63769] Sum rewards: -4.439, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.656', 'AMMO2': '0.001', 'AMMO4': '0.006', 'AMMO5': '0.028', 'WEAPON1': '0.030', 'ARMOR': '0.056', 'AMMO3': '0.149', 'HITCOUNT': '0.150', 'DAMAGECOUNT': '0.465', 'weapon5': '0.496', 'WEAPON5': '0.650', 'WEAPON3': '0.950', 'weapon2': '1.204', 'weapon3': '1.782', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:59:05,679][63769] DAMAGECOUNT value on done: 8066.0 +[2023-09-14 14:59:05,679][63769] Sum rewards: -5.789, reward structure: {'DEATHCOUNT': '-12.000', 'weapon5': '0.002', 'AMMO5': '0.003', 'AMMO2': '0.009', 'ARMOR': '0.020', 'AMMO4': '0.045', 'WEAPON5': '0.050', 'HITCOUNT': '0.130', 'AMMO3': '0.166', 'HEALTH': '0.358', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.372', 'weapon3': '1.886'} +[2023-09-14 14:59:06,187][63732] Updated weights for policy 0, policy_version 1900 (0.0011) +[2023-09-14 14:59:07,993][63767] DAMAGECOUNT value on done: 12545.0 +[2023-09-14 14:59:07,993][63767] Sum rewards: 0.904, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.700', 'AMMO2': '0.012', 'AMMO5': '0.020', 'WEAPON1': '0.020', 'ARMOR': '0.052', 'AMMO4': '0.061', 'weapon4': '0.092', 'AMMO3': '0.162', 'weapon5': '0.190', 'WEAPON4': '0.200', 'WEAPON5': '0.350', 'HITCOUNT': '0.440', 'WEAPON3': '0.850', 'weapon2': '1.336', 'DAMAGECOUNT': '1.635', 'weapon3': '1.934', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:59:08,307][63770] DAMAGECOUNT value on done: 9372.0 +[2023-09-14 14:59:08,339][63767] DAMAGECOUNT value on done: 11995.0 +[2023-09-14 14:59:08,339][63767] Sum rewards: 0.335, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.328', 'weapon7': '0.002', 'AMMO2': '0.009', 'AMMO5': '0.023', 'AMMO4': '0.043', 'WEAPON4': '0.100', 'AMMO3': '0.113', 'HITCOUNT': '0.130', 'weapon4': '0.186', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon5': '0.322', 'WEAPON5': '0.450', 'ARMOR': '0.502', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.936', 'weapon3': '1.170', 'weapon2': '1.678', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:59:08,697][63770] DAMAGECOUNT value on done: 10379.0 +[2023-09-14 14:59:08,697][63770] Sum rewards: 3.667, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.056', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'weapon7': '0.014', 'AMMO5': '0.017', 'ARMOR': '0.036', 'WEAPON1': '0.040', 'weapon5': '0.086', 'weapon4': '0.098', 'WEAPON4': '0.100', 'AMMO3': '0.137', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.250', 'HITCOUNT': '0.360', 'WEAPON3': '0.800', 'weapon2': '1.324', 'DAMAGECOUNT': '1.797', 'weapon3': '2.094', 'FRAGCOUNT': '6.000'} +[2023-09-14 14:59:09,568][63734] DAMAGECOUNT value on done: 10822.0 +[2023-09-14 14:59:09,568][63734] Sum rewards: -2.138, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.584', 'AMMO5': '0.005', 'weapon5': '0.008', 'AMMO2': '0.012', 'weapon4': '0.014', 'AMMO4': '0.059', 'ARMOR': '0.060', 'weapon7': '0.066', 'AMMO3': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'HITCOUNT': '0.140', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON7': '0.200', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.690', 'weapon2': '1.338', 'weapon3': '1.634', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:59:09,949][63734] DAMAGECOUNT value on done: 10814.0 +[2023-09-14 14:59:09,950][63734] Sum rewards: -0.485, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.391', 'AMMO2': '0.007', 'weapon4': '0.020', 'AMMO4': '0.032', 'weapon7': '0.092', 'WEAPON4': '0.100', 'ARMOR': '0.110', 'AMMO3': '0.116', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON7': '0.200', 'HITCOUNT': '0.210', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.161', 'weapon2': '1.414', 'weapon3': '1.804', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:59:10,070][63805] DAMAGECOUNT value on done: 11827.0 +[2023-09-14 14:59:10,070][63805] Sum rewards: -4.719, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.629', 'AMMO2': '0.004', 'AMMO5': '0.005', 'ARMOR': '0.016', 'AMMO4': '0.019', 'WEAPON4': '0.100', 'HITCOUNT': '0.130', 'AMMO3': '0.156', 'DAMAGECOUNT': '0.372', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.534', 'weapon3': '1.724'} +[2023-09-14 14:59:10,387][63733] Updated weights for policy 1, policy_version 1800 (0.0011) +[2023-09-14 14:59:10,446][63805] DAMAGECOUNT value on done: 9243.0 +[2023-09-14 14:59:12,461][63454] Saving new best policy, reward=-1.097! +[2023-09-14 14:59:13,066][63734] DAMAGECOUNT value on done: 10811.0 +[2023-09-14 14:59:13,066][63734] Sum rewards: -0.674, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.850', 'AMMO2': '0.005', 'AMMO5': '0.005', 'AMMO4': '0.023', 'weapon7': '0.062', 'weapon5': '0.066', 'AMMO3': '0.076', 'WEAPON5': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.290', 'weapon4': '0.408', 'WEAPON3': '0.450', 'ARMOR': '0.525', 'weapon2': '0.758', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.176', 'weapon3': '1.342'} +[2023-09-14 14:59:13,110][63769] DAMAGECOUNT value on done: 10935.0 +[2023-09-14 14:59:13,110][63769] Sum rewards: 0.167, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.007', 'AMMO2': '0.017', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'HITCOUNT': '0.080', 'AMMO4': '0.085', 'AMMO3': '0.088', 'WEAPON5': '0.100', 'weapon4': '0.186', 'DAMAGECOUNT': '0.255', 'WEAPON3': '0.450', 'HEALTH': '0.810', 'FRAGCOUNT': '1.000', 'weapon3': '1.216', 'weapon2': '1.782'} +[2023-09-14 14:59:13,405][63732] Updated weights for policy 0, policy_version 1910 (0.0011) +[2023-09-14 14:59:13,436][63734] DAMAGECOUNT value on done: 8970.0 +[2023-09-14 14:59:13,436][63734] Sum rewards: 2.195, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.304', 'AMMO2': '0.008', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.038', 'ARMOR': '0.076', 'weapon5': '0.096', 'AMMO3': '0.103', 'HITCOUNT': '0.210', 'WEAPON5': '0.250', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.822', 'weapon2': '1.330', 'FRAGCOUNT': '2.000', 'weapon3': '2.244'} +[2023-09-14 14:59:13,481][63769] DAMAGECOUNT value on done: 10103.0 +[2023-09-14 14:59:16,722][63767] DAMAGECOUNT value on done: 13106.0 +[2023-09-14 14:59:16,723][63767] Sum rewards: -4.449, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-2.000', 'HEALTH': '-0.353', 'AMMO2': '0.005', 'AMMO5': '0.010', 'AMMO4': '0.024', 'ARMOR': '0.060', 'AMMO3': '0.145', 'WEAPON5': '0.150', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon5': '0.298', 'HITCOUNT': '0.350', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.152', 'weapon2': '1.288', 'weapon3': '2.122'} +[2023-09-14 14:59:17,085][63767] DAMAGECOUNT value on done: 14795.0 +[2023-09-14 14:59:17,086][63767] Sum rewards: 0.318, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.473', 'AMMO5': '0.012', 'AMMO2': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.040', 'AMMO4': '0.070', 'AMMO3': '0.090', 'weapon5': '0.132', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'HITCOUNT': '0.200', 'weapon4': '0.202', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.026', 'weapon2': '1.326', 'weapon3': '1.708'} +[2023-09-14 14:59:17,467][63454] Saving new best policy, reward=-1.016! +[2023-09-14 14:59:17,600][63733] Updated weights for policy 1, policy_version 1810 (0.0011) +[2023-09-14 14:59:18,511][63771] DAMAGECOUNT value on done: 9784.0 +[2023-09-14 14:59:18,511][63771] Sum rewards: -0.413, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.520', 'AMMO4': '-0.013', 'AMMO2': '-0.002', 'AMMO5': '0.017', 'weapon5': '0.022', 'AMMO3': '0.133', 'HITCOUNT': '0.250', 'WEAPON5': '0.250', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.762', 'weapon2': '1.428', 'weapon3': '2.010', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:59:18,842][63771] DAMAGECOUNT value on done: 12140.0 +[2023-09-14 14:59:18,842][63771] Sum rewards: -3.891, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.472', 'AMMO5': '0.020', 'AMMO2': '0.024', 'weapon5': '0.036', 'ARMOR': '0.076', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO4': '0.117', 'AMMO3': '0.125', 'weapon7': '0.134', 'HITCOUNT': '0.180', 'WEAPON4': '0.200', 'weapon4': '0.212', 'WEAPON5': '0.300', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.507', 'weapon2': '1.244', 'weapon3': '1.606'} +[2023-09-14 14:59:19,785][63735] Large shaping reward -2.504 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.255, -85.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 14:59:19,886][63806] DAMAGECOUNT value on done: 10547.0 +[2023-09-14 14:59:19,887][63806] Sum rewards: -0.702, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.266', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'weapon5': '0.010', 'AMMO5': '0.015', 'ARMOR': '0.036', 'AMMO3': '0.102', 'HITCOUNT': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.687', 'FRAGCOUNT': '1.000', 'weapon2': '1.084', 'weapon3': '1.910'} +[2023-09-14 14:59:20,199][63806] DAMAGECOUNT value on done: 10230.0 +[2023-09-14 14:59:20,496][63732] Updated weights for policy 0, policy_version 1920 (0.0010) +[2023-09-14 14:59:20,802][63806] DAMAGECOUNT value on done: 10036.0 +[2023-09-14 14:59:20,802][63806] Sum rewards: -2.265, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.274', 'weapon5': '0.002', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'WEAPON5': '0.050', 'ARMOR': '0.052', 'AMMO4': '0.087', 'WEAPON4': '0.100', 'AMMO3': '0.183', 'weapon4': '0.210', 'HITCOUNT': '0.480', 'WEAPON3': '0.900', 'weapon2': '1.536', 'DAMAGECOUNT': '1.647', 'weapon3': '1.732', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:59:20,805][63735] DAMAGECOUNT value on done: 10175.0 +[2023-09-14 14:59:20,806][63735] Sum rewards: -6.058, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.470', 'AMMO4': '-0.058', 'AMMO2': '-0.012', 'AMMO5': '0.010', 'weapon5': '0.010', 'WEAPON1': '0.020', 'AMMO3': '0.117', 'HITCOUNT': '0.200', 'WEAPON5': '0.200', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.927', 'weapon3': '1.670', 'weapon2': '1.778', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:59:21,239][63806] DAMAGECOUNT value on done: 10600.0 +[2023-09-14 14:59:21,240][63806] Sum rewards: -1.699, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.246', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'AMMO5': '0.015', 'ARMOR': '0.032', 'weapon5': '0.060', 'AMMO3': '0.142', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.525', 'WEAPON3': '0.800', 'weapon2': '1.180', 'weapon3': '1.964', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:59:21,249][63735] DAMAGECOUNT value on done: 12458.0 +[2023-09-14 14:59:21,249][63735] Sum rewards: -8.204, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-3.000', 'HEALTH': '-2.086', 'AMMO4': '-0.037', 'AMMO2': '-0.007', 'AMMO5': '0.021', 'WEAPON1': '0.030', 'ARMOR': '0.052', 'weapon5': '0.134', 'HITCOUNT': '0.140', 'AMMO3': '0.164', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.950', 'weapon2': '1.782', 'weapon3': '1.788'} +[2023-09-14 14:59:22,092][63770] DAMAGECOUNT value on done: 12755.0 +[2023-09-14 14:59:22,092][63770] Sum rewards: 2.836, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.506', 'AMMO5': '0.013', 'AMMO2': '0.019', 'WEAPON4': '0.050', 'AMMO4': '0.096', 'AMMO3': '0.137', 'weapon4': '0.140', 'WEAPON5': '0.200', 'HITCOUNT': '0.290', 'weapon5': '0.350', 'ARMOR': '0.575', 'WEAPON3': '0.700', 'weapon3': '1.418', 'weapon2': '1.988', 'DAMAGECOUNT': '2.115', 'FRAGCOUNT': '3.500'} +[2023-09-14 14:59:22,328][63735] DAMAGECOUNT value on done: 11465.0 +[2023-09-14 14:59:22,328][63735] Sum rewards: -0.634, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.324', 'AMMO2': '0.005', 'AMMO5': '0.008', 'weapon4': '0.016', 'AMMO4': '0.025', 'weapon5': '0.054', 'WEAPON4': '0.100', 'AMMO3': '0.129', 'WEAPON5': '0.150', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.350', 'ARMOR': '0.507', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.362', 'weapon2': '1.666', 'weapon3': '1.918', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:59:22,429][63770] DAMAGECOUNT value on done: 8949.0 +[2023-09-14 14:59:22,430][63770] Sum rewards: -1.526, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO5': '0.005', 'AMMO2': '0.011', 'WEAPON5': '0.050', 'AMMO4': '0.055', 'HITCOUNT': '0.060', 'AMMO3': '0.092', 'HEALTH': '0.140', 'DAMAGECOUNT': '0.210', 'WEAPON3': '0.450', 'FRAGCOUNT': '1.000', 'weapon3': '1.566', 'weapon2': '1.584'} +[2023-09-14 14:59:22,732][63735] DAMAGECOUNT value on done: 8583.0 +[2023-09-14 14:59:22,897][63805] DAMAGECOUNT value on done: 12110.0 +[2023-09-14 14:59:22,898][63805] Sum rewards: -0.125, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.122', 'AMMO2': '0.011', 'AMMO5': '0.017', 'AMMO4': '0.053', 'AMMO3': '0.102', 'weapon5': '0.204', 'HITCOUNT': '0.240', 'WEAPON5': '0.250', 'ARMOR': '0.494', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.885', 'weapon2': '1.558', 'weapon3': '1.782'} +[2023-09-14 14:59:23,235][63805] DAMAGECOUNT value on done: 13314.0 +[2023-09-14 14:59:23,236][63805] Sum rewards: -0.561, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.307', 'AMMO2': '0.014', 'AMMO5': '0.016', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'AMMO4': '0.070', 'AMMO3': '0.078', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon5': '0.184', 'weapon7': '0.196', 'HITCOUNT': '0.200', 'WEAPON5': '0.300', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.681', 'FRAGCOUNT': '1.000', 'weapon3': '1.082', 'weapon2': '2.030'} +[2023-09-14 14:59:23,916][63771] DAMAGECOUNT value on done: 11452.0 +[2023-09-14 14:59:23,916][63771] Sum rewards: -1.413, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.800', 'WEAPON1': '0.010', 'AMMO2': '0.028', 'HITCOUNT': '0.070', 'ARMOR': '0.080', 'AMMO3': '0.105', 'AMMO4': '0.138', 'WEAPON4': '0.250', 'weapon4': '0.268', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.088', 'weapon2': '1.420'} +[2023-09-14 14:59:24,309][63771] DAMAGECOUNT value on done: 8557.0 +[2023-09-14 14:59:24,693][63733] Updated weights for policy 1, policy_version 1820 (0.0011) +[2023-09-14 14:59:26,241][63769] Large shaping reward 2.632 for [('FRAGCOUNT', 2.0, 2.0), ('HITCOUNT', 0.03, 3.0), ('DAMAGECOUNT', 0.6, 200), ('weapon7', 0.002)] +[2023-09-14 14:59:27,487][63732] Updated weights for policy 0, policy_version 1930 (0.0012) +[2023-09-14 14:59:29,933][63769] DAMAGECOUNT value on done: 11485.0 +[2023-09-14 14:59:29,933][63769] Sum rewards: -2.360, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.344', 'AMMO2': '0.007', 'ARMOR': '0.024', 'AMMO5': '0.025', 'AMMO4': '0.033', 'weapon7': '0.074', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.140', 'AMMO3': '0.164', 'weapon5': '0.188', 'WEAPON7': '0.200', 'WEAPON5': '0.450', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.263', 'weapon2': '1.360', 'weapon3': '1.916', 'FRAGCOUNT': '2.500'} +[2023-09-14 14:59:30,348][63769] DAMAGECOUNT value on done: 8136.0 +[2023-09-14 14:59:30,349][63769] Sum rewards: -4.752, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.090', 'AMMO2': '0.012', 'ARMOR': '0.040', 'HITCOUNT': '0.060', 'AMMO4': '0.061', 'WEAPON4': '0.100', 'AMMO3': '0.107', 'DAMAGECOUNT': '0.210', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.558', 'weapon2': '1.640'} +[2023-09-14 14:59:30,406][63767] DAMAGECOUNT value on done: 12708.0 +[2023-09-14 14:59:30,406][63767] Sum rewards: 0.455, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.434', 'AMMO5': '0.015', 'AMMO2': '0.029', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'ARMOR': '0.053', 'weapon7': '0.078', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon5': '0.108', 'AMMO3': '0.122', 'AMMO4': '0.143', 'HITCOUNT': '0.160', 'weapon4': '0.188', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.489', 'WEAPON3': '0.700', 'weapon2': '0.734', 'weapon3': '1.990', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:59:30,730][63767] DAMAGECOUNT value on done: 12075.0 +[2023-09-14 14:59:31,551][63733] Updated weights for policy 1, policy_version 1830 (0.0009) +[2023-09-14 14:59:32,465][63734] DAMAGECOUNT value on done: 10857.0 +[2023-09-14 14:59:32,466][63734] Sum rewards: -4.303, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.820', 'AMMO4': '-0.008', 'AMMO2': '-0.002', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'weapon5': '0.032', 'HITCOUNT': '0.040', 'DAMAGECOUNT': '0.105', 'AMMO3': '0.179', 'WEAPON5': '0.200', 'WEAPON3': '0.850', 'weapon2': '1.474', 'weapon3': '1.614', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:59:32,727][63805] DAMAGECOUNT value on done: 12096.0 +[2023-09-14 14:59:32,727][63805] Sum rewards: -1.249, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.476', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.025', 'weapon5': '0.026', 'ARMOR': '0.040', 'WEAPON5': '0.050', 'AMMO4': '0.127', 'AMMO3': '0.137', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'weapon4': '0.244', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.807', 'weapon2': '1.414', 'weapon3': '1.424', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:59:32,799][63734] DAMAGECOUNT value on done: 10999.0 +[2023-09-14 14:59:32,799][63734] Sum rewards: -2.584, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.376', 'AMMO4': '-0.039', 'AMMO2': '-0.008', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'weapon5': '0.038', 'ARMOR': '0.048', 'AMMO3': '0.118', 'HITCOUNT': '0.150', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.555', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.452', 'weapon3': '1.892'} +[2023-09-14 14:59:33,101][63770] DAMAGECOUNT value on done: 9532.0 +[2023-09-14 14:59:33,102][63770] Sum rewards: -2.753, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.675', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.013', 'weapon4': '0.032', 'ARMOR': '0.040', 'AMMO4': '0.067', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.131', 'HITCOUNT': '0.150', 'DAMAGECOUNT': '0.480', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.224', 'weapon3': '2.020'} +[2023-09-14 14:59:33,166][63805] DAMAGECOUNT value on done: 9448.0 +[2023-09-14 14:59:33,167][63805] Sum rewards: -2.281, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.959', 'AMMO4': '-0.039', 'AMMO2': '-0.008', 'AMMO5': '0.010', 'weapon5': '0.022', 'ARMOR': '0.024', 'WEAPON5': '0.100', 'AMMO3': '0.146', 'HITCOUNT': '0.150', 'DAMAGECOUNT': '0.615', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.408', 'weapon2': '1.950'} +[2023-09-14 14:59:33,461][63770] DAMAGECOUNT value on done: 10909.0 +[2023-09-14 14:59:33,461][63770] Sum rewards: -1.008, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.895', 'AMMO4': '-0.033', 'AMMO2': '-0.007', 'AMMO5': '0.031', 'weapon4': '0.054', 'weapon7': '0.056', 'WEAPON4': '0.100', 'AMMO3': '0.124', 'weapon5': '0.164', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.360', 'WEAPON5': '0.500', 'WEAPON3': '0.850', 'weapon2': '1.242', 'DAMAGECOUNT': '1.590', 'weapon3': '2.006', 'FRAGCOUNT': '2.500'} +[2023-09-14 14:59:35,220][63732] Updated weights for policy 0, policy_version 1940 (0.0011) +[2023-09-14 14:59:35,967][63734] DAMAGECOUNT value on done: 11371.0 +[2023-09-14 14:59:35,968][63734] Sum rewards: 2.295, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.924', 'AMMO4': '-0.006', 'AMMO2': '-0.001', 'AMMO5': '0.010', 'ARMOR': '0.032', 'weapon5': '0.156', 'AMMO3': '0.214', 'WEAPON5': '0.250', 'HITCOUNT': '0.390', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.680', 'weapon2': '1.820', 'weapon3': '1.824', 'FRAGCOUNT': '6.500'} +[2023-09-14 14:59:36,263][63769] DAMAGECOUNT value on done: 11255.0 +[2023-09-14 14:59:36,263][63769] Sum rewards: -4.545, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.577', 'AMMO4': '-0.027', 'AMMO2': '-0.005', 'AMMO5': '0.005', 'weapon5': '0.006', 'WEAPON1': '0.020', 'WEAPON5': '0.100', 'AMMO3': '0.149', 'HITCOUNT': '0.250', 'WEAPON3': '0.950', 'DAMAGECOUNT': '0.960', 'FRAGCOUNT': '1.000', 'weapon2': '1.324', 'weapon3': '2.050'} +[2023-09-14 14:59:36,352][63734] DAMAGECOUNT value on done: 9189.0 +[2023-09-14 14:59:36,352][63734] Sum rewards: -0.589, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.825', 'AMMO4': '-0.023', 'AMMO2': '-0.005', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'weapon5': '0.030', 'ARMOR': '0.048', 'weapon7': '0.066', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.157', 'HITCOUNT': '0.180', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.657', 'WEAPON3': '0.700', 'weapon2': '1.480', 'weapon3': '1.916', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:59:36,600][63769] DAMAGECOUNT value on done: 10500.0 +[2023-09-14 14:59:36,601][63769] Sum rewards: 0.290, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.110', 'AMMO2': '0.022', 'weapon4': '0.028', 'WEAPON4': '0.050', 'weapon7': '0.092', 'AMMO3': '0.096', 'AMMO4': '0.108', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.200', 'WEAPON7': '0.200', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.170', 'weapon2': '1.302', 'weapon3': '1.492', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:59:38,063][63733] Updated weights for policy 1, policy_version 1840 (0.0011) +[2023-09-14 14:59:39,395][63767] DAMAGECOUNT value on done: 13386.0 +[2023-09-14 14:59:39,396][63767] Sum rewards: -3.215, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.126', 'AMMO2': '0.001', 'AMMO4': '0.003', 'WEAPON1': '0.010', 'AMMO5': '0.025', 'ARMOR': '0.028', 'weapon5': '0.094', 'AMMO3': '0.178', 'HITCOUNT': '0.230', 'WEAPON5': '0.500', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.840', 'weapon2': '1.188', 'FRAGCOUNT': '2.000', 'weapon3': '2.264'} +[2023-09-14 14:59:39,733][63767] DAMAGECOUNT value on done: 15427.0 +[2023-09-14 14:59:39,733][63767] Sum rewards: 3.520, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.560', 'AMMO5': '0.007', 'AMMO2': '0.009', 'WEAPON1': '0.010', 'ARMOR': '0.024', 'AMMO4': '0.046', 'weapon7': '0.048', 'AMMO3': '0.107', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon5': '0.194', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.340', 'WEAPON3': '0.650', 'weapon3': '1.664', 'weapon2': '1.694', 'DAMAGECOUNT': '1.896', 'FRAGCOUNT': '3.500'} +[2023-09-14 14:59:41,294][63771] DAMAGECOUNT value on done: 10017.0 +[2023-09-14 14:59:41,295][63771] Sum rewards: 1.262, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.242', 'WEAPON1': '0.010', 'AMMO5': '0.014', 'AMMO2': '0.019', 'ARMOR': '0.024', 'WEAPON4': '0.050', 'AMMO4': '0.096', 'AMMO3': '0.109', 'weapon4': '0.200', 'HITCOUNT': '0.220', 'WEAPON5': '0.300', 'weapon5': '0.334', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.699', 'weapon2': '0.910', 'weapon3': '1.668', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:59:41,647][63771] DAMAGECOUNT value on done: 12650.0 +[2023-09-14 14:59:41,647][63771] Sum rewards: -1.335, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-0.236', 'weapon7': '0.002', 'ARMOR': '0.004', 'AMMO2': '0.004', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO4': '0.020', 'weapon5': '0.032', 'WEAPON5': '0.100', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'AMMO3': '0.205', 'HITCOUNT': '0.430', 'weapon2': '0.976', 'WEAPON3': '1.100', 'DAMAGECOUNT': '1.530', 'weapon3': '2.632', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:59:42,356][63806] DAMAGECOUNT value on done: 10647.0 +[2023-09-14 14:59:42,356][63806] Sum rewards: -8.655, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-3.052', 'AMMO5': '0.007', 'weapon5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'ARMOR': '0.032', 'AMMO4': '0.055', 'HITCOUNT': '0.080', 'AMMO3': '0.109', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.436', 'weapon3': '1.696'} +[2023-09-14 14:59:42,461][63454] Saving new best policy, reward=-0.894! +[2023-09-14 14:59:42,691][63806] DAMAGECOUNT value on done: 10492.0 +[2023-09-14 14:59:42,691][63806] Sum rewards: 0.730, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.820', 'AMMO5': '0.007', 'AMMO2': '0.010', 'weapon5': '0.038', 'AMMO3': '0.045', 'weapon4': '0.046', 'AMMO4': '0.047', 'ARMOR': '0.068', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'HITCOUNT': '0.210', 'WEAPON3': '0.350', 'DAMAGECOUNT': '0.786', 'weapon3': '1.210', 'weapon2': '1.732', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:59:43,979][63732] Updated weights for policy 0, policy_version 1950 (0.0011) +[2023-09-14 14:59:43,984][63733] Updated weights for policy 1, policy_version 1850 (0.0011) +[2023-09-14 14:59:44,723][63806] DAMAGECOUNT value on done: 10264.0 +[2023-09-14 14:59:44,724][63806] Sum rewards: -3.826, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.860', 'AMMO2': '0.006', 'AMMO5': '0.015', 'AMMO4': '0.030', 'WEAPON1': '0.040', 'AMMO3': '0.149', 'HITCOUNT': '0.150', 'weapon5': '0.178', 'WEAPON5': '0.300', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.684', 'WEAPON3': '0.750', 'weapon3': '1.512', 'weapon2': '1.720'} +[2023-09-14 14:59:44,937][63735] DAMAGECOUNT value on done: 10390.0 +[2023-09-14 14:59:44,938][63735] Sum rewards: -2.671, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.836', 'AMMO2': '0.005', 'AMMO5': '0.015', 'weapon5': '0.022', 'ARMOR': '0.024', 'AMMO4': '0.027', 'WEAPON1': '0.080', 'AMMO3': '0.138', 'HITCOUNT': '0.180', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.645', 'WEAPON3': '0.900', 'weapon2': '1.214', 'weapon3': '1.914', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:59:45,103][63806] DAMAGECOUNT value on done: 10935.0 +[2023-09-14 14:59:45,103][63806] Sum rewards: -1.803, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.912', 'AMMO4': '-0.003', 'AMMO2': '-0.001', 'WEAPON1': '0.040', 'ARMOR': '0.072', 'weapon4': '0.078', 'WEAPON4': '0.100', 'AMMO3': '0.108', 'HITCOUNT': '0.270', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.005', 'weapon3': '1.056', 'weapon2': '1.784'} +[2023-09-14 14:59:45,327][63735] DAMAGECOUNT value on done: 13022.0 +[2023-09-14 14:59:45,328][63735] Sum rewards: -0.495, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.804', 'weapon4': '0.006', 'AMMO2': '0.017', 'WEAPON1': '0.020', 'AMMO5': '0.020', 'ARMOR': '0.040', 'AMMO4': '0.086', 'WEAPON4': '0.100', 'weapon5': '0.156', 'AMMO3': '0.176', 'HITCOUNT': '0.260', 'WEAPON5': '0.300', 'WEAPON3': '0.900', 'weapon2': '1.350', 'DAMAGECOUNT': '1.692', 'weapon3': '1.936', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:59:45,646][63805] DAMAGECOUNT value on done: 12551.0 +[2023-09-14 14:59:45,647][63805] Sum rewards: 3.179, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.485', 'AMMO2': '0.007', 'AMMO5': '0.012', 'AMMO4': '0.037', 'AMMO3': '0.164', 'weapon5': '0.186', 'WEAPON5': '0.200', 'HITCOUNT': '0.290', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.323', 'weapon2': '1.420', 'weapon3': '1.774', 'FRAGCOUNT': '5.000'} +[2023-09-14 14:59:46,035][63805] DAMAGECOUNT value on done: 13688.0 +[2023-09-14 14:59:46,035][63805] Sum rewards: 2.184, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.836', 'AMMO2': '0.016', 'weapon7': '0.016', 'AMMO5': '0.025', 'weapon5': '0.052', 'AMMO4': '0.077', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.163', 'WEAPON5': '0.300', 'HITCOUNT': '0.320', 'ARMOR': '0.432', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.927', 'weapon2': '1.348', 'weapon3': '2.294', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:59:46,355][63735] DAMAGECOUNT value on done: 11685.0 +[2023-09-14 14:59:46,356][63735] Sum rewards: -3.556, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.155', 'AMMO4': '-0.018', 'AMMO2': '-0.004', 'AMMO5': '0.015', 'ARMOR': '0.028', 'weapon5': '0.094', 'AMMO3': '0.151', 'WEAPON5': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.220', 'DAMAGECOUNT': '0.660', 'WEAPON3': '0.950', 'weapon2': '1.480', 'weapon3': '1.972', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:59:46,793][63735] DAMAGECOUNT value on done: 8798.0 +[2023-09-14 14:59:46,794][63735] Sum rewards: -5.196, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.270', 'ARMOR': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.011', 'weapon5': '0.026', 'AMMO4': '0.052', 'AMMO3': '0.140', 'WEAPON5': '0.150', 'HITCOUNT': '0.220', 'DAMAGECOUNT': '0.645', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.596', 'weapon3': '1.666'} +[2023-09-14 14:59:46,980][63770] DAMAGECOUNT value on done: 13021.0 +[2023-09-14 14:59:46,981][63770] Sum rewards: -4.463, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.108', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.011', 'AMMO2': '0.022', 'ARMOR': '0.075', 'AMMO4': '0.109', 'weapon5': '0.124', 'AMMO3': '0.133', 'HITCOUNT': '0.200', 'weapon4': '0.218', 'WEAPON4': '0.250', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.798', 'WEAPON3': '0.900', 'weapon2': '1.154', 'weapon3': '1.850'} +[2023-09-14 14:59:47,226][63771] DAMAGECOUNT value on done: 11492.0 +[2023-09-14 14:59:47,415][63770] DAMAGECOUNT value on done: 9164.0 +[2023-09-14 14:59:47,415][63770] Sum rewards: -2.812, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.470', 'AMMO2': '0.001', 'AMMO4': '0.002', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'ARMOR': '0.016', 'WEAPON4': '0.050', 'weapon5': '0.050', 'weapon4': '0.118', 'HITCOUNT': '0.130', 'AMMO3': '0.149', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.645', 'WEAPON3': '0.800', 'weapon3': '1.288', 'weapon2': '1.494', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:59:47,468][63454] Saving new best policy, reward=-0.870! +[2023-09-14 14:59:47,612][63771] DAMAGECOUNT value on done: 8604.0 +[2023-09-14 14:59:50,229][63733] Updated weights for policy 1, policy_version 1860 (0.0011) +[2023-09-14 14:59:53,006][63732] Updated weights for policy 0, policy_version 1960 (0.0010) +[2023-09-14 14:59:53,551][63767] DAMAGECOUNT value on done: 12952.0 +[2023-09-14 14:59:53,552][63767] Sum rewards: -0.276, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.472', 'AMMO2': '0.005', 'WEAPON1': '0.010', 'AMMO5': '0.017', 'AMMO4': '0.024', 'ARMOR': '0.076', 'AMMO3': '0.098', 'HITCOUNT': '0.200', 'WEAPON5': '0.250', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.732', 'weapon3': '1.562', 'weapon2': '1.572', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:59:53,895][63767] DAMAGECOUNT value on done: 12399.0 +[2023-09-14 14:59:53,896][63767] Sum rewards: -2.514, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.188', 'ARMOR': '0.004', 'AMMO2': '0.008', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'AMMO4': '0.041', 'AMMO3': '0.113', 'WEAPON5': '0.200', 'HITCOUNT': '0.250', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.972', 'weapon3': '1.558', 'weapon2': '1.848', 'FRAGCOUNT': '4.000'} +[2023-09-14 14:59:55,183][63769] DAMAGECOUNT value on done: 11653.0 +[2023-09-14 14:59:55,183][63769] Sum rewards: -4.674, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.057', 'AMMO5': '0.015', 'AMMO2': '0.029', 'ARMOR': '0.057', 'weapon5': '0.074', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'weapon7': '0.126', 'AMMO4': '0.142', 'AMMO3': '0.152', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON7': '0.200', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.504', 'WEAPON3': '1.050', 'weapon2': '1.656', 'weapon3': '1.848', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:59:55,541][63769] DAMAGECOUNT value on done: 8324.0 +[2023-09-14 14:59:55,979][63734] DAMAGECOUNT value on done: 11126.0 +[2023-09-14 14:59:55,979][63734] Sum rewards: 1.627, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-1.046', 'weapon4': '0.004', 'AMMO5': '0.005', 'AMMO2': '0.026', 'WEAPON1': '0.040', 'WEAPON4': '0.050', 'AMMO3': '0.065', 'ARMOR': '0.076', 'WEAPON5': '0.100', 'weapon5': '0.100', 'AMMO4': '0.128', 'HITCOUNT': '0.180', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.807', 'weapon2': '1.530', 'weapon3': '1.562', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:59:56,071][63805] DAMAGECOUNT value on done: 12236.0 +[2023-09-14 14:59:56,072][63805] Sum rewards: -1.372, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.050', 'AMMO4': '-0.019', 'AMMO2': '-0.004', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'AMMO3': '0.081', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.550', 'weapon3': '1.316', 'weapon2': '1.858', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:59:56,343][63733] Updated weights for policy 1, policy_version 1870 (0.0011) +[2023-09-14 14:59:56,350][63734] DAMAGECOUNT value on done: 11169.0 +[2023-09-14 14:59:56,351][63734] Sum rewards: -2.895, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.610', 'AMMO5': '0.005', 'weapon5': '0.006', 'AMMO2': '0.007', 'WEAPON1': '0.020', 'AMMO4': '0.037', 'ARMOR': '0.040', 'WEAPON5': '0.100', 'AMMO3': '0.102', 'HITCOUNT': '0.150', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.600', 'weapon3': '1.412', 'weapon2': '1.726', 'FRAGCOUNT': '2.000'} +[2023-09-14 14:59:56,442][63805] DAMAGECOUNT value on done: 9751.0 +[2023-09-14 14:59:56,442][63805] Sum rewards: -0.807, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.180', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.010', 'ARMOR': '0.012', 'WEAPON5': '0.050', 'AMMO4': '0.050', 'weapon7': '0.086', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.133', 'WEAPON7': '0.200', 'HITCOUNT': '0.240', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.909', 'weapon2': '1.050', 'weapon3': '1.830', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:59:58,721][63734] DAMAGECOUNT value on done: 11783.0 +[2023-09-14 14:59:58,722][63734] Sum rewards: -1.210, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.680', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.022', 'ARMOR': '0.045', 'weapon5': '0.094', 'AMMO3': '0.146', 'WEAPON5': '0.250', 'HITCOUNT': '0.270', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.236', 'weapon2': '1.470', 'FRAGCOUNT': '2.000', 'weapon3': '2.010'} +[2023-09-14 14:59:58,729][63770] DAMAGECOUNT value on done: 9681.0 +[2023-09-14 14:59:59,042][63734] DAMAGECOUNT value on done: 9641.0 +[2023-09-14 14:59:59,043][63734] Sum rewards: 3.247, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.264', 'AMMO5': '0.005', 'AMMO2': '0.010', 'weapon4': '0.028', 'AMMO4': '0.049', 'WEAPON4': '0.050', 'weapon5': '0.054', 'ARMOR': '0.072', 'WEAPON5': '0.100', 'AMMO3': '0.113', 'HITCOUNT': '0.330', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.356', 'weapon2': '1.356', 'weapon3': '1.888', 'FRAGCOUNT': '3.500'} +[2023-09-14 14:59:59,161][63770] DAMAGECOUNT value on done: 11480.0 +[2023-09-14 14:59:59,162][63770] Sum rewards: 1.956, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO5': '0.015', 'AMMO2': '0.023', 'HEALTH': '0.034', 'ARMOR': '0.052', 'weapon7': '0.070', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'AMMO4': '0.115', 'AMMO3': '0.118', 'weapon5': '0.136', 'WEAPON5': '0.250', 'weapon4': '0.350', 'HITCOUNT': '0.510', 'weapon2': '0.558', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.713', 'weapon3': '2.112', 'FRAGCOUNT': '3.000'} +[2023-09-14 14:59:59,896][63769] DAMAGECOUNT value on done: 11496.0 +[2023-09-14 14:59:59,896][63769] Sum rewards: -4.012, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.946', 'AMMO4': '-0.020', 'AMMO2': '-0.004', 'AMMO5': '0.010', 'HITCOUNT': '0.170', 'AMMO3': '0.181', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.723', 'WEAPON3': '1.050', 'weapon2': '1.088', 'FRAGCOUNT': '2.000', 'weapon3': '2.286'} +[2023-09-14 15:00:00,276][63769] DAMAGECOUNT value on done: 10785.0 +[2023-09-14 15:00:00,276][63769] Sum rewards: -2.862, reward structure: {'DEATHCOUNT': '-9.750', 'AMMO2': '0.008', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'weapon5': '0.012', 'ARMOR': '0.028', 'AMMO4': '0.037', 'WEAPON4': '0.050', 'weapon4': '0.062', 'AMMO3': '0.144', 'WEAPON5': '0.150', 'HITCOUNT': '0.220', 'HEALTH': '0.260', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.855', 'FRAGCOUNT': '1.000', 'weapon2': '1.148', 'weapon3': '2.144'} +[2023-09-14 15:00:01,836][63732] Updated weights for policy 0, policy_version 1970 (0.0011) +[2023-09-14 15:00:02,455][63767] DAMAGECOUNT value on done: 13560.0 +[2023-09-14 15:00:02,456][63767] Sum rewards: -2.738, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.150', 'AMMO2': '0.009', 'AMMO5': '0.010', 'ARMOR': '0.016', 'WEAPON1': '0.030', 'weapon5': '0.032', 'AMMO4': '0.045', 'WEAPON4': '0.050', 'weapon4': '0.050', 'AMMO3': '0.087', 'HITCOUNT': '0.170', 'WEAPON5': '0.200', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.522', 'FRAGCOUNT': '1.000', 'weapon3': '1.098', 'weapon2': '1.892'} +[2023-09-14 15:00:02,459][63733] Updated weights for policy 1, policy_version 1880 (0.0013) +[2023-09-14 15:00:02,469][63454] Saving new best policy, reward=-0.866! +[2023-09-14 15:00:02,779][63767] DAMAGECOUNT value on done: 15627.0 +[2023-09-14 15:00:02,780][63767] Sum rewards: -2.656, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.219', 'AMMO5': '0.005', 'AMMO2': '0.010', 'WEAPON1': '0.040', 'AMMO4': '0.049', 'WEAPON5': '0.100', 'ARMOR': '0.120', 'AMMO3': '0.173', 'HITCOUNT': '0.180', 'DAMAGECOUNT': '0.600', 'WEAPON3': '1.000', 'weapon2': '1.630', 'weapon3': '1.656', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:00:03,751][63771] DAMAGECOUNT value on done: 10331.0 +[2023-09-14 15:00:03,751][63771] Sum rewards: -1.694, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.590', 'AMMO2': '0.014', 'AMMO5': '0.015', 'ARMOR': '0.045', 'AMMO4': '0.068', 'AMMO3': '0.134', 'weapon5': '0.196', 'WEAPON5': '0.250', 'HITCOUNT': '0.290', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.942', 'FRAGCOUNT': '1.000', 'weapon2': '1.310', 'weapon3': '2.132'} +[2023-09-14 15:00:04,082][63771] DAMAGECOUNT value on done: 13077.0 +[2023-09-14 15:00:04,083][63771] Sum rewards: 1.615, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.558', 'AMMO2': '0.004', 'AMMO5': '0.007', 'weapon5': '0.008', 'AMMO4': '0.020', 'WEAPON5': '0.050', 'ARMOR': '0.068', 'weapon7': '0.094', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.135', 'weapon4': '0.196', 'WEAPON7': '0.200', 'HITCOUNT': '0.380', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.281', 'weapon2': '1.322', 'weapon3': '1.418', 'FRAGCOUNT': '5.000'} +[2023-09-14 15:00:07,426][63806] DAMAGECOUNT value on done: 10926.0 +[2023-09-14 15:00:07,426][63806] Sum rewards: -0.059, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.591', 'weapon5': '0.002', 'AMMO2': '0.008', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'ARMOR': '0.040', 'AMMO4': '0.041', 'AMMO3': '0.083', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'HITCOUNT': '0.280', 'weapon4': '0.490', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.837', 'weapon2': '1.006', 'weapon3': '1.672', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:00:07,467][63454] Saving new best policy, reward=-0.845! +[2023-09-14 15:00:07,801][63806] DAMAGECOUNT value on done: 10744.0 +[2023-09-14 15:00:07,802][63806] Sum rewards: -0.325, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.230', 'AMMO5': '0.005', 'weapon5': '0.010', 'AMMO2': '0.023', 'weapon4': '0.098', 'WEAPON5': '0.100', 'AMMO3': '0.107', 'AMMO4': '0.114', 'ARMOR': '0.130', 'WEAPON4': '0.150', 'HITCOUNT': '0.220', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.756', 'weapon2': '0.888', 'FRAGCOUNT': '1.000', 'weapon3': '1.654'} +[2023-09-14 15:00:08,198][63805] DAMAGECOUNT value on done: 13111.0 +[2023-09-14 15:00:08,198][63805] Sum rewards: -1.322, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.350', 'AMMO2': '0.010', 'AMMO5': '0.015', 'AMMO4': '0.052', 'ARMOR': '0.128', 'AMMO3': '0.153', 'WEAPON5': '0.250', 'HITCOUNT': '0.270', 'weapon5': '0.278', 'WEAPON3': '0.950', 'weapon3': '1.570', 'DAMAGECOUNT': '1.680', 'weapon2': '1.922', 'FRAGCOUNT': '2.500'} +[2023-09-14 15:00:08,549][63805] DAMAGECOUNT value on done: 14094.0 +[2023-09-14 15:00:08,550][63805] Sum rewards: 3.400, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.007', 'AMMO2': '0.010', 'ARMOR': '0.018', 'AMMO4': '0.047', 'WEAPON4': '0.050', 'weapon5': '0.066', 'AMMO3': '0.080', 'weapon7': '0.092', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.194', 'HITCOUNT': '0.220', 'HEALTH': '0.236', 'WEAPON3': '0.500', 'DAMAGECOUNT': '1.218', 'weapon2': '1.258', 'weapon3': '2.004', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:00:08,634][63733] Updated weights for policy 1, policy_version 1890 (0.0011) +[2023-09-14 15:00:09,621][63735] DAMAGECOUNT value on done: 10498.0 +[2023-09-14 15:00:09,621][63735] Sum rewards: -0.458, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.007', 'weapon5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.019', 'AMMO3': '0.067', 'AMMO4': '0.095', 'HITCOUNT': '0.120', 'WEAPON5': '0.150', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.324', 'HEALTH': '0.487', 'FRAGCOUNT': '1.000', 'weapon3': '1.120', 'weapon2': '1.832'} +[2023-09-14 15:00:09,859][63806] DAMAGECOUNT value on done: 10729.0 +[2023-09-14 15:00:09,859][63806] Sum rewards: -3.922, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.277', 'AMMO4': '-0.008', 'AMMO2': '-0.001', 'AMMO5': '0.013', 'weapon5': '0.030', 'ARMOR': '0.060', 'WEAPON5': '0.150', 'AMMO3': '0.195', 'HITCOUNT': '0.380', 'WEAPON3': '1.100', 'weapon2': '1.310', 'DAMAGECOUNT': '1.395', 'weapon3': '2.482', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:00:10,003][63735] DAMAGECOUNT value on done: 13310.0 +[2023-09-14 15:00:10,004][63735] Sum rewards: -0.366, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO5': '0.005', 'ARMOR': '0.008', 'AMMO2': '0.010', 'WEAPON4': '0.050', 'AMMO4': '0.051', 'WEAPON5': '0.100', 'weapon4': '0.100', 'AMMO3': '0.120', 'weapon5': '0.122', 'HITCOUNT': '0.240', 'HEALTH': '0.284', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.864', 'weapon2': '1.458', 'FRAGCOUNT': '2.000', 'weapon3': '2.022'} +[2023-09-14 15:00:10,279][63806] DAMAGECOUNT value on done: 11185.0 +[2023-09-14 15:00:10,279][63806] Sum rewards: -1.372, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.014', 'AMMO4': '-0.000', 'AMMO2': '0.000', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'weapon4': '0.044', 'ARMOR': '0.048', 'WEAPON4': '0.050', 'AMMO3': '0.138', 'WEAPON5': '0.150', 'HITCOUNT': '0.240', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.750', 'weapon2': '1.276', 'weapon3': '1.718', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:00:10,279][63771] DAMAGECOUNT value on done: 11507.0 +[2023-09-14 15:00:10,608][63771] DAMAGECOUNT value on done: 8994.0 +[2023-09-14 15:00:10,609][63771] Sum rewards: -2.482, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.242', 'AMMO4': '-0.008', 'AMMO2': '-0.002', 'weapon5': '0.002', 'AMMO5': '0.007', 'ARMOR': '0.040', 'AMMO3': '0.142', 'WEAPON5': '0.150', 'HITCOUNT': '0.280', 'WEAPON3': '0.950', 'DAMAGECOUNT': '1.170', 'weapon2': '1.572', 'weapon3': '1.956', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:00:11,084][63735] DAMAGECOUNT value on done: 11893.0 +[2023-09-14 15:00:11,085][63735] Sum rewards: -2.958, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.180', 'AMMO2': '0.003', 'AMMO5': '0.007', 'AMMO4': '0.012', 'weapon4': '0.068', 'WEAPON4': '0.100', 'AMMO3': '0.153', 'weapon5': '0.178', 'HITCOUNT': '0.200', 'WEAPON5': '0.250', 'WEAPON3': '0.500', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.624', 'weapon2': '1.252', 'weapon3': '1.874'} +[2023-09-14 15:00:11,204][63732] Updated weights for policy 0, policy_version 1980 (0.0011) +[2023-09-14 15:00:11,545][63735] DAMAGECOUNT value on done: 9023.0 +[2023-09-14 15:00:11,545][63735] Sum rewards: -4.348, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.358', 'weapon5': '0.014', 'AMMO2': '0.014', 'WEAPON1': '0.020', 'AMMO5': '0.023', 'ARMOR': '0.046', 'weapon4': '0.048', 'AMMO4': '0.070', 'WEAPON4': '0.100', 'AMMO3': '0.122', 'HITCOUNT': '0.160', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.616', 'weapon2': '1.702'} +[2023-09-14 15:00:12,463][63454] Saving new best policy, reward=-0.728! +[2023-09-14 15:00:12,649][63770] DAMAGECOUNT value on done: 13206.0 +[2023-09-14 15:00:12,649][63770] Sum rewards: -0.320, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.507', 'AMMO4': '-0.015', 'AMMO2': '-0.003', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'ARMOR': '0.064', 'AMMO3': '0.093', 'HITCOUNT': '0.150', 'weapon5': '0.158', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.555', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.606', 'weapon3': '1.696'} +[2023-09-14 15:00:13,035][63770] DAMAGECOUNT value on done: 9389.0 +[2023-09-14 15:00:13,036][63770] Sum rewards: 0.105, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.040', 'AMMO5': '0.013', 'ARMOR': '0.015', 'AMMO2': '0.016', 'WEAPON1': '0.030', 'weapon5': '0.036', 'AMMO4': '0.081', 'AMMO3': '0.085', 'WEAPON4': '0.100', 'weapon4': '0.180', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.675', 'weapon3': '0.986', 'FRAGCOUNT': '1.000', 'weapon2': '2.208'} +[2023-09-14 15:00:14,040][63733] Updated weights for policy 1, policy_version 1900 (0.0010) +[2023-09-14 15:00:16,392][63767] DAMAGECOUNT value on done: 12952.0 +[2023-09-14 15:00:16,704][63767] DAMAGECOUNT value on done: 12699.0 +[2023-09-14 15:00:16,705][63767] Sum rewards: -1.932, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.330', 'AMMO2': '0.001', 'AMMO4': '0.005', 'AMMO5': '0.007', 'weapon5': '0.012', 'WEAPON1': '0.030', 'AMMO3': '0.128', 'WEAPON5': '0.150', 'HITCOUNT': '0.190', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.900', 'weapon2': '1.496', 'weapon3': '1.928', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:00:17,466][63454] Saving new best policy, reward=-0.676! +[2023-09-14 15:00:19,365][63734] DAMAGECOUNT value on done: 11216.0 +[2023-09-14 15:00:19,366][63734] Sum rewards: -0.874, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO5': '0.007', 'AMMO2': '0.026', 'WEAPON1': '0.030', 'HEALTH': '0.050', 'weapon5': '0.054', 'ARMOR': '0.080', 'HITCOUNT': '0.090', 'weapon4': '0.094', 'AMMO3': '0.098', 'AMMO4': '0.129', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.270', 'WEAPON3': '0.400', 'weapon3': '1.194', 'weapon2': '1.754', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:00:19,431][63805] DAMAGECOUNT value on done: 12405.0 +[2023-09-14 15:00:19,431][63805] Sum rewards: -3.583, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.495', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'weapon5': '0.006', 'AMMO5': '0.015', 'ARMOR': '0.068', 'AMMO3': '0.161', 'HITCOUNT': '0.170', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.507', 'WEAPON3': '0.850', 'weapon2': '1.574', 'FRAGCOUNT': '2.000', 'weapon3': '2.016'} +[2023-09-14 15:00:19,657][63733] Updated weights for policy 1, policy_version 1910 (0.0011) +[2023-09-14 15:00:19,758][63734] DAMAGECOUNT value on done: 11184.0 +[2023-09-14 15:00:19,823][63805] DAMAGECOUNT value on done: 10312.0 +[2023-09-14 15:00:19,823][63805] Sum rewards: -2.775, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.820', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'ARMOR': '0.036', 'AMMO3': '0.167', 'WEAPON5': '0.300', 'HITCOUNT': '0.450', 'WEAPON3': '0.950', 'weapon2': '1.454', 'DAMAGECOUNT': '1.683', 'weapon3': '1.740', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:00:20,261][63769] DAMAGECOUNT value on done: 11818.0 +[2023-09-14 15:00:20,663][63769] DAMAGECOUNT value on done: 8461.0 +[2023-09-14 15:00:20,663][63769] Sum rewards: -1.441, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.294', 'AMMO5': '0.010', 'AMMO2': '0.014', 'WEAPON1': '0.020', 'weapon5': '0.022', 'weapon4': '0.040', 'AMMO4': '0.071', 'ARMOR': '0.076', 'AMMO3': '0.100', 'WEAPON4': '0.100', 'HITCOUNT': '0.120', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.411', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.350', 'weapon3': '1.668'} +[2023-09-14 15:00:20,967][63734] DAMAGECOUNT value on done: 12324.0 +[2023-09-14 15:00:20,968][63734] Sum rewards: -0.146, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.820', 'AMMO2': '0.008', 'AMMO5': '0.021', 'AMMO4': '0.037', 'WEAPON4': '0.050', 'AMMO3': '0.125', 'weapon5': '0.180', 'HITCOUNT': '0.310', 'WEAPON5': '0.450', 'WEAPON3': '0.700', 'weapon2': '1.230', 'DAMAGECOUNT': '1.623', 'FRAGCOUNT': '2.000', 'weapon3': '2.190'} +[2023-09-14 15:00:21,294][63734] DAMAGECOUNT value on done: 9935.0 +[2023-09-14 15:00:21,295][63734] Sum rewards: -2.508, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.712', 'AMMO2': '0.002', 'AMMO4': '0.010', 'AMMO5': '0.010', 'WEAPON4': '0.100', 'weapon4': '0.100', 'ARMOR': '0.108', 'AMMO3': '0.133', 'HITCOUNT': '0.140', 'WEAPON5': '0.200', 'weapon5': '0.330', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.882', 'weapon2': '1.510', 'weapon3': '1.628'} +[2023-09-14 15:00:21,609][63732] Updated weights for policy 0, policy_version 1990 (0.0010) +[2023-09-14 15:00:22,462][63576] Saving new best policy, reward=-2.726! +[2023-09-14 15:00:23,676][63769] DAMAGECOUNT value on done: 11696.0 +[2023-09-14 15:00:23,676][63769] Sum rewards: -0.950, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.202', 'AMMO4': '-0.045', 'AMMO2': '-0.009', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'weapon5': '0.036', 'ARMOR': '0.044', 'WEAPON5': '0.100', 'AMMO3': '0.147', 'HITCOUNT': '0.220', 'DAMAGECOUNT': '0.600', 'WEAPON3': '0.900', 'weapon2': '1.398', 'weapon3': '1.836', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:00:24,008][63770] DAMAGECOUNT value on done: 9981.0 +[2023-09-14 15:00:24,009][63770] Sum rewards: -4.953, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.305', 'AMMO4': '-0.013', 'AMMO2': '-0.003', 'weapon5': '0.002', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'ARMOR': '0.040', 'WEAPON5': '0.100', 'AMMO3': '0.153', 'HITCOUNT': '0.250', 'DAMAGECOUNT': '0.900', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.296', 'weapon3': '2.162'} +[2023-09-14 15:00:24,062][63769] DAMAGECOUNT value on done: 10995.0 +[2023-09-14 15:00:24,063][63769] Sum rewards: -2.662, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.006', 'AMMO2': '0.004', 'AMMO5': '0.005', 'weapon5': '0.008', 'AMMO4': '0.022', 'WEAPON1': '0.030', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'weapon4': '0.114', 'HITCOUNT': '0.130', 'AMMO3': '0.147', 'DAMAGECOUNT': '0.630', 'WEAPON3': '0.850', 'weapon2': '0.974', 'FRAGCOUNT': '2.000', 'weapon3': '2.240'} +[2023-09-14 15:00:24,365][63770] DAMAGECOUNT value on done: 11844.0 +[2023-09-14 15:00:24,365][63770] Sum rewards: 3.271, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.695', 'AMMO2': '0.004', 'AMMO5': '0.007', 'AMMO4': '0.019', 'ARMOR': '0.056', 'weapon5': '0.074', 'AMMO3': '0.112', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'weapon7': '0.308', 'HITCOUNT': '0.310', 'weapon4': '0.336', 'AMMO6': '0.400', 'WEAPON7': '0.400', 'AMMO7': '0.400', 'WEAPON3': '0.650', 'weapon2': '0.788', 'DAMAGECOUNT': '1.092', 'weapon3': '1.810', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:00:25,094][63733] Updated weights for policy 1, policy_version 1920 (0.0010) +[2023-09-14 15:00:25,389][63767] DAMAGECOUNT value on done: 13586.0 +[2023-09-14 15:00:25,670][63771] DAMAGECOUNT value on done: 10663.0 +[2023-09-14 15:00:25,670][63771] Sum rewards: 1.448, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.384', 'AMMO5': '0.010', 'AMMO2': '0.015', 'WEAPON5': '0.050', 'AMMO4': '0.075', 'AMMO3': '0.104', 'weapon5': '0.114', 'WEAPON4': '0.150', 'weapon4': '0.176', 'HITCOUNT': '0.290', 'ARMOR': '0.468', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.996', 'weapon3': '1.178', 'weapon2': '1.606', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:00:25,796][63767] DAMAGECOUNT value on done: 15742.0 +[2023-09-14 15:00:26,069][63805] Large shaping reward -2.549 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.3, -100.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 15:00:26,079][63771] DAMAGECOUNT value on done: 13680.0 +[2023-09-14 15:00:26,079][63771] Sum rewards: 6.388, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO4': '-0.002', 'AMMO2': '-0.000', 'AMMO5': '0.007', 'ARMOR': '0.008', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'weapon7': '0.050', 'AMMO3': '0.070', 'weapon5': '0.078', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon4': '0.124', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'HEALTH': '0.307', 'WEAPON3': '0.350', 'HITCOUNT': '0.400', 'weapon2': '1.092', 'weapon3': '1.384', 'DAMAGECOUNT': '1.809', 'FRAGCOUNT': '6.000'} +[2023-09-14 15:00:27,467][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001924_7880704.pth... +[2023-09-14 15:00:27,467][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001995_8171520.pth... +[2023-09-14 15:00:27,538][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001669_6836224.pth +[2023-09-14 15:00:27,539][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001586_6496256.pth +[2023-09-14 15:00:27,548][63454] Saving new best policy, reward=-0.596! +[2023-09-14 15:00:30,306][63733] Updated weights for policy 1, policy_version 1930 (0.0011) +[2023-09-14 15:00:31,394][63805] DAMAGECOUNT value on done: 13357.0 +[2023-09-14 15:00:31,394][63805] Sum rewards: -3.185, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.542', 'AMMO5': '0.003', 'AMMO2': '0.013', 'ARMOR': '0.044', 'WEAPON5': '0.050', 'AMMO4': '0.067', 'WEAPON4': '0.100', 'AMMO3': '0.112', 'weapon4': '0.132', 'HITCOUNT': '0.230', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.738', 'FRAGCOUNT': '1.000', 'weapon3': '1.136', 'weapon2': '2.082'} +[2023-09-14 15:00:31,719][63805] DAMAGECOUNT value on done: 14294.0 +[2023-09-14 15:00:31,719][63805] Sum rewards: -6.637, reward structure: {'DEATHCOUNT': '-9.000', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.126', 'AMMO2': '0.002', 'AMMO5': '0.007', 'AMMO4': '0.011', 'weapon5': '0.026', 'WEAPON1': '0.060', 'AMMO3': '0.102', 'WEAPON5': '0.150', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.600', 'WEAPON3': '0.650', 'weapon2': '1.474', 'weapon3': '1.696'} +[2023-09-14 15:00:32,016][63806] DAMAGECOUNT value on done: 10941.0 +[2023-09-14 15:00:32,016][63806] Sum rewards: -2.193, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.624', 'AMMO5': '0.003', 'AMMO2': '0.008', 'HITCOUNT': '0.010', 'WEAPON1': '0.010', 'weapon5': '0.012', 'AMMO4': '0.041', 'DAMAGECOUNT': '0.045', 'WEAPON4': '0.050', 'WEAPON5': '0.050', 'AMMO3': '0.084', 'weapon4': '0.130', 'ARMOR': '0.176', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.282', 'weapon2': '1.780'} +[2023-09-14 15:00:32,434][63806] DAMAGECOUNT value on done: 11122.0 +[2023-09-14 15:00:32,435][63806] Sum rewards: -2.234, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.681', 'AMMO2': '0.006', 'AMMO5': '0.020', 'AMMO4': '0.032', 'ARMOR': '0.044', 'weapon4': '0.118', 'weapon5': '0.130', 'AMMO3': '0.135', 'WEAPON4': '0.150', 'HITCOUNT': '0.280', 'WEAPON5': '0.350', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.134', 'weapon2': '1.452', 'weapon3': '1.596'} +[2023-09-14 15:00:33,581][63732] Updated weights for policy 0, policy_version 2000 (0.0012) +[2023-09-14 15:00:33,785][63771] DAMAGECOUNT value on done: 11627.0 +[2023-09-14 15:00:33,785][63771] Sum rewards: 0.978, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.040', 'weapon4': '0.010', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'AMMO2': '0.015', 'weapon5': '0.022', 'weapon7': '0.076', 'AMMO4': '0.076', 'HITCOUNT': '0.080', 'AMMO3': '0.087', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON7': '0.200', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.360', 'WEAPON3': '0.650', 'weapon2': '1.182', 'weapon3': '1.844', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:00:33,925][63735] DAMAGECOUNT value on done: 10503.0 +[2023-09-14 15:00:34,161][63771] DAMAGECOUNT value on done: 9219.0 +[2023-09-14 15:00:34,162][63771] Sum rewards: -5.378, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-0.644', 'AMMO5': '0.007', 'weapon5': '0.012', 'AMMO2': '0.015', 'weapon4': '0.018', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'AMMO4': '0.074', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'AMMO3': '0.225', 'DAMAGECOUNT': '0.675', 'weapon2': '0.720', 'WEAPON3': '1.200', 'FRAGCOUNT': '2.000', 'weapon3': '2.670'} +[2023-09-14 15:00:34,253][63735] DAMAGECOUNT value on done: 13593.0 +[2023-09-14 15:00:34,253][63735] Sum rewards: 2.282, reward structure: {'DEATHCOUNT': '-3.750', 'HEALTH': '-0.238', 'AMMO4': '-0.016', 'AMMO2': '-0.003', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'AMMO3': '0.050', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon7': '0.154', 'HITCOUNT': '0.190', 'WEAPON7': '0.200', 'weapon5': '0.268', 'WEAPON5': '0.300', 'WEAPON3': '0.350', 'FRAGCOUNT': '0.500', 'ARMOR': '0.504', 'DAMAGECOUNT': '0.849', 'weapon3': '1.194', 'weapon2': '1.452'} +[2023-09-14 15:00:34,477][63806] DAMAGECOUNT value on done: 11090.0 +[2023-09-14 15:00:34,477][63806] Sum rewards: -4.599, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.358', 'AMMO5': '0.016', 'AMMO2': '0.019', 'ARMOR': '0.072', 'AMMO4': '0.096', 'weapon5': '0.100', 'AMMO3': '0.188', 'HITCOUNT': '0.200', 'WEAPON4': '0.200', 'WEAPON5': '0.350', 'DAMAGECOUNT': '1.083', 'WEAPON3': '1.150', 'weapon2': '1.574', 'weapon3': '1.960', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:00:34,828][63806] DAMAGECOUNT value on done: 11338.0 +[2023-09-14 15:00:34,829][63806] Sum rewards: -4.345, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.128', 'AMMO5': '0.003', 'AMMO2': '0.013', 'weapon4': '0.018', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.065', 'ARMOR': '0.076', 'AMMO3': '0.157', 'HITCOUNT': '0.160', 'DAMAGECOUNT': '0.459', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon3': '1.760', 'weapon2': '1.872'} +[2023-09-14 15:00:35,420][63735] DAMAGECOUNT value on done: 12302.0 +[2023-09-14 15:00:35,420][63735] Sum rewards: 0.944, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.898', 'AMMO2': '0.006', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO4': '0.027', 'weapon5': '0.034', 'weapon7': '0.074', 'ARMOR': '0.104', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.121', 'WEAPON5': '0.150', 'WEAPON7': '0.200', 'WEAPON4': '0.250', 'HITCOUNT': '0.350', 'weapon4': '0.388', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.227', 'weapon3': '1.610', 'weapon2': '1.634', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:00:35,497][63733] Updated weights for policy 1, policy_version 1940 (0.0010) +[2023-09-14 15:00:35,790][63735] DAMAGECOUNT value on done: 9217.0 +[2023-09-14 15:00:35,791][63735] Sum rewards: -0.620, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.034', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'AMMO5': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.040', 'weapon5': '0.070', 'AMMO3': '0.117', 'HITCOUNT': '0.210', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.582', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.688', 'weapon2': '1.774'} +[2023-09-14 15:00:38,050][63770] DAMAGECOUNT value on done: 13646.0 +[2023-09-14 15:00:38,051][63770] Sum rewards: 1.800, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.986', 'AMMO2': '0.002', 'AMMO4': '0.008', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'ARMOR': '0.062', 'AMMO3': '0.127', 'weapon5': '0.140', 'HITCOUNT': '0.190', 'AMMO6': '0.240', 'AMMO7': '0.240', 'weapon7': '0.292', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'weapon4': '0.366', 'WEAPON7': '0.400', 'WEAPON3': '0.850', 'weapon2': '1.270', 'DAMAGECOUNT': '1.320', 'weapon3': '1.394', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:00:38,441][63770] DAMAGECOUNT value on done: 9455.0 +[2023-09-14 15:00:39,882][63767] DAMAGECOUNT value on done: 13170.0 +[2023-09-14 15:00:39,883][63767] Sum rewards: -3.295, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.420', 'AMMO2': '0.012', 'WEAPON1': '0.040', 'AMMO4': '0.060', 'ARMOR': '0.112', 'AMMO3': '0.115', 'WEAPON4': '0.150', 'HITCOUNT': '0.160', 'weapon4': '0.328', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.654', 'FRAGCOUNT': '1.000', 'weapon3': '1.414', 'weapon2': '1.680'} +[2023-09-14 15:00:40,272][63767] DAMAGECOUNT value on done: 12808.0 +[2023-09-14 15:00:40,573][63733] Updated weights for policy 1, policy_version 1950 (0.0010) +[2023-09-14 15:00:42,461][63454] Saving new best policy, reward=-0.583! +[2023-09-14 15:00:42,892][63734] DAMAGECOUNT value on done: 12891.0 +[2023-09-14 15:00:42,893][63734] Sum rewards: -0.610, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.267', 'AMMO5': '0.005', 'AMMO2': '0.014', 'weapon5': '0.052', 'AMMO4': '0.067', 'AMMO3': '0.125', 'WEAPON5': '0.150', 'weapon4': '0.308', 'WEAPON4': '0.350', 'HITCOUNT': '0.460', 'ARMOR': '0.571', 'WEAPON3': '0.850', 'weapon2': '1.518', 'DAMAGECOUNT': '1.701', 'weapon3': '1.736', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:00:43,030][63805] DAMAGECOUNT value on done: 12610.0 +[2023-09-14 15:00:43,030][63805] Sum rewards: -1.170, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.730', 'weapon5': '0.002', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.010', 'ARMOR': '0.024', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.051', 'AMMO3': '0.121', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.615', 'WEAPON3': '0.750', 'weapon2': '1.090', 'FRAGCOUNT': '2.000', 'weapon3': '2.114'} +[2023-09-14 15:00:43,208][63734] DAMAGECOUNT value on done: 10616.0 +[2023-09-14 15:00:43,208][63734] Sum rewards: 4.440, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.457', 'AMMO5': '0.005', 'AMMO2': '0.006', 'AMMO4': '0.030', 'WEAPON5': '0.100', 'weapon5': '0.106', 'AMMO3': '0.113', 'HITCOUNT': '0.460', 'ARMOR': '0.502', 'WEAPON3': '0.650', 'weapon3': '1.540', 'DAMAGECOUNT': '2.043', 'weapon2': '2.092', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:00:43,257][63734] DAMAGECOUNT value on done: 11316.0 +[2023-09-14 15:00:43,386][63805] DAMAGECOUNT value on done: 10387.0 +[2023-09-14 15:00:43,616][63734] DAMAGECOUNT value on done: 11561.0 +[2023-09-14 15:00:43,616][63734] Sum rewards: 0.436, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.645', 'AMMO5': '0.005', 'AMMO2': '0.013', 'AMMO4': '0.065', 'weapon4': '0.088', 'WEAPON5': '0.100', 'ARMOR': '0.120', 'AMMO3': '0.134', 'WEAPON4': '0.200', 'HITCOUNT': '0.260', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.131', 'weapon3': '1.558', 'weapon2': '1.906', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:00:45,494][63769] DAMAGECOUNT value on done: 11943.0 +[2023-09-14 15:00:45,672][63733] Updated weights for policy 1, policy_version 1960 (0.0011) +[2023-09-14 15:00:45,893][63769] DAMAGECOUNT value on done: 8730.0 +[2023-09-14 15:00:45,894][63769] Sum rewards: 1.501, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.747', 'AMMO5': '0.010', 'AMMO2': '0.018', 'WEAPON1': '0.030', 'ARMOR': '0.044', 'AMMO3': '0.084', 'AMMO4': '0.091', 'weapon6': '0.092', 'HITCOUNT': '0.160', 'AMMO6': '0.194', 'AMMO7': '0.194', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'WEAPON6': '0.200', 'weapon4': '0.252', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.807', 'weapon3': '1.310', 'weapon2': '1.562', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:00:46,484][63732] Updated weights for policy 0, policy_version 2010 (0.0010) +[2023-09-14 15:00:47,467][63454] Saving new best policy, reward=-0.464! +[2023-09-14 15:00:47,894][63769] DAMAGECOUNT value on done: 11725.0 +[2023-09-14 15:00:47,894][63769] Sum rewards: -5.506, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-1.023', 'AMMO2': '0.001', 'AMMO5': '0.003', 'AMMO4': '0.006', 'weapon5': '0.008', 'HITCOUNT': '0.050', 'WEAPON5': '0.050', 'DAMAGECOUNT': '0.087', 'ARMOR': '0.090', 'AMMO3': '0.094', 'WEAPON3': '0.600', 'weapon3': '1.094', 'weapon2': '2.434'} +[2023-09-14 15:00:48,235][63769] DAMAGECOUNT value on done: 11171.0 +[2023-09-14 15:00:49,127][63767] DAMAGECOUNT value on done: 13741.0 +[2023-09-14 15:00:49,402][63770] DAMAGECOUNT value on done: 10426.0 +[2023-09-14 15:00:49,403][63770] Sum rewards: 5.023, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.410', 'AMMO5': '0.005', 'AMMO2': '0.013', 'weapon5': '0.056', 'AMMO4': '0.063', 'AMMO3': '0.099', 'WEAPON5': '0.100', 'ARMOR': '0.108', 'WEAPON4': '0.200', 'HITCOUNT': '0.340', 'weapon4': '0.394', 'WEAPON3': '0.700', 'weapon3': '1.250', 'DAMAGECOUNT': '1.335', 'weapon2': '1.770', 'FRAGCOUNT': '6.000'} +[2023-09-14 15:00:49,538][63771] DAMAGECOUNT value on done: 10808.0 +[2023-09-14 15:00:49,539][63771] Sum rewards: -0.457, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.085', 'AMMO4': '-0.055', 'AMMO2': '-0.011', 'AMMO5': '0.005', 'weapon5': '0.046', 'AMMO3': '0.060', 'ARMOR': '0.088', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.480', 'weapon2': '2.120'} +[2023-09-14 15:00:49,539][63767] DAMAGECOUNT value on done: 16023.0 +[2023-09-14 15:00:49,539][63767] Sum rewards: 0.239, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.196', 'AMMO2': '0.015', 'AMMO5': '0.020', 'WEAPON1': '0.020', 'weapon5': '0.038', 'ARMOR': '0.040', 'AMMO4': '0.076', 'AMMO3': '0.131', 'HITCOUNT': '0.250', 'WEAPON5': '0.300', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.843', 'weapon2': '1.466', 'weapon3': '1.936', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:00:49,810][63770] DAMAGECOUNT value on done: 12432.0 +[2023-09-14 15:00:49,810][63770] Sum rewards: 8.596, reward structure: {'DEATHCOUNT': '-3.000', 'AMMO2': '0.007', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO4': '0.035', 'AMMO3': '0.060', 'WEAPON5': '0.100', 'HITCOUNT': '0.260', 'HEALTH': '0.282', 'weapon5': '0.320', 'WEAPON3': '0.350', 'ARMOR': '0.827', 'weapon2': '1.112', 'weapon3': '1.458', 'DAMAGECOUNT': '1.764', 'FRAGCOUNT': '5.000'} +[2023-09-14 15:00:49,913][63771] DAMAGECOUNT value on done: 13850.0 +[2023-09-14 15:00:51,029][63733] Updated weights for policy 1, policy_version 1970 (0.0010) +[2023-09-14 15:00:52,462][63576] Saving new best policy, reward=-2.707! +[2023-09-14 15:00:52,462][63454] Saving new best policy, reward=-0.363! +[2023-09-14 15:00:55,449][63805] DAMAGECOUNT value on done: 13607.0 +[2023-09-14 15:00:55,811][63805] DAMAGECOUNT value on done: 14544.0 +[2023-09-14 15:00:55,811][63805] Sum rewards: 0.105, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO5': '0.007', 'weapon5': '0.018', 'AMMO2': '0.021', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'AMMO3': '0.061', 'weapon4': '0.070', 'WEAPON5': '0.100', 'AMMO4': '0.104', 'HITCOUNT': '0.200', 'WEAPON3': '0.350', 'HEALTH': '0.728', 'DAMAGECOUNT': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.364', 'weapon2': '2.002'} +[2023-09-14 15:00:56,521][63733] Updated weights for policy 1, policy_version 1980 (0.0011) +[2023-09-14 15:00:56,787][63806] DAMAGECOUNT value on done: 11298.0 +[2023-09-14 15:00:56,788][63806] Sum rewards: -2.743, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.528', 'weapon5': '0.002', 'AMMO2': '0.005', 'AMMO5': '0.018', 'AMMO4': '0.025', 'ARMOR': '0.040', 'AMMO3': '0.156', 'WEAPON5': '0.250', 'HITCOUNT': '0.270', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.071', 'weapon3': '1.306', 'weapon2': '2.142', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:00:57,252][63806] DAMAGECOUNT value on done: 11393.0 +[2023-09-14 15:00:57,252][63806] Sum rewards: -4.469, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.994', 'FRAGCOUNT': '-1.000', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.017', 'WEAPON4': '0.100', 'AMMO3': '0.158', 'weapon4': '0.168', 'weapon5': '0.188', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.230', 'WEAPON5': '0.250', 'ARMOR': '0.539', 'DAMAGECOUNT': '0.813', 'weapon2': '1.032', 'WEAPON3': '1.100', 'weapon3': '2.304'} +[2023-09-14 15:00:57,468][63576] Saving new best policy, reward=-2.684! +[2023-09-14 15:00:58,398][63732] Updated weights for policy 0, policy_version 2020 (0.0013) +[2023-09-14 15:00:58,444][63806] DAMAGECOUNT value on done: 11231.0 +[2023-09-14 15:00:58,445][63806] Sum rewards: -6.906, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.752', 'AMMO2': '0.007', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.032', 'weapon5': '0.036', 'WEAPON4': '0.050', 'weapon4': '0.056', 'ARMOR': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.155', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.423', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.364', 'weapon3': '2.178'} +[2023-09-14 15:00:58,703][63735] DAMAGECOUNT value on done: 10853.0 +[2023-09-14 15:00:58,703][63735] Sum rewards: -2.617, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.813', 'AMMO2': '0.003', 'AMMO4': '0.016', 'ARMOR': '0.092', 'WEAPON4': '0.100', 'AMMO3': '0.115', 'weapon4': '0.136', 'HITCOUNT': '0.310', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.050', 'weapon2': '1.478', 'FRAGCOUNT': '2.000', 'weapon3': '2.046'} +[2023-09-14 15:00:58,840][63806] DAMAGECOUNT value on done: 11593.0 +[2023-09-14 15:00:58,840][63806] Sum rewards: -2.235, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.172', 'AMMO2': '0.019', 'WEAPON1': '0.020', 'AMMO5': '0.023', 'weapon5': '0.048', 'AMMO4': '0.094', 'WEAPON4': '0.100', 'AMMO3': '0.145', 'HITCOUNT': '0.220', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.765', 'WEAPON3': '0.800', 'weapon2': '1.512', 'weapon3': '1.842', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:00:58,873][63771] DAMAGECOUNT value on done: 11802.0 +[2023-09-14 15:00:58,874][63771] Sum rewards: -2.729, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.724', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO2': '0.020', 'weapon4': '0.046', 'weapon5': '0.052', 'ARMOR': '0.096', 'AMMO4': '0.101', 'AMMO3': '0.123', 'HITCOUNT': '0.180', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.525', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.554', 'weapon3': '1.720'} +[2023-09-14 15:00:59,117][63735] DAMAGECOUNT value on done: 13983.0 +[2023-09-14 15:00:59,118][63735] Sum rewards: -0.375, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.814', 'AMMO5': '0.007', 'AMMO2': '0.009', 'WEAPON1': '0.020', 'weapon4': '0.026', 'ARMOR': '0.040', 'AMMO4': '0.047', 'weapon5': '0.084', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'AMMO3': '0.174', 'HITCOUNT': '0.300', 'WEAPON3': '0.850', 'weapon2': '1.160', 'DAMAGECOUNT': '1.170', 'weapon3': '2.302', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:00:59,257][63771] DAMAGECOUNT value on done: 9428.0 +[2023-09-14 15:00:59,258][63771] Sum rewards: -1.382, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.452', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.012', 'weapon5': '0.038', 'weapon4': '0.044', 'WEAPON4': '0.050', 'ARMOR': '0.056', 'AMMO4': '0.061', 'AMMO3': '0.088', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.627', 'weapon3': '1.346', 'FRAGCOUNT': '2.000', 'weapon2': '2.118'} +[2023-09-14 15:01:00,246][63735] DAMAGECOUNT value on done: 12717.0 +[2023-09-14 15:01:00,246][63735] Sum rewards: -1.082, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.780', 'AMMO4': '-0.014', 'AMMO2': '-0.003', 'ARMOR': '0.012', 'AMMO5': '0.015', 'weapon5': '0.064', 'weapon7': '0.082', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.128', 'WEAPON7': '0.200', 'HITCOUNT': '0.240', 'WEAPON5': '0.300', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.245', 'weapon2': '1.534', 'weapon3': '1.654', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:01:00,629][63735] DAMAGECOUNT value on done: 9297.0 +[2023-09-14 15:01:00,629][63735] Sum rewards: -5.717, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.284', 'AMMO4': '-0.014', 'AMMO2': '-0.003', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'weapon5': '0.020', 'ARMOR': '0.032', 'HITCOUNT': '0.090', 'WEAPON5': '0.100', 'AMMO3': '0.165', 'DAMAGECOUNT': '0.240', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.334', 'weapon2': '2.278'} +[2023-09-14 15:01:02,001][63733] Updated weights for policy 1, policy_version 1990 (0.0011) +[2023-09-14 15:01:03,610][63770] DAMAGECOUNT value on done: 13990.0 +[2023-09-14 15:01:03,610][63770] Sum rewards: 0.658, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.760', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'ARMOR': '0.020', 'AMMO2': '0.024', 'weapon5': '0.048', 'AMMO3': '0.079', 'AMMO4': '0.122', 'WEAPON4': '0.150', 'WEAPON5': '0.250', 'HITCOUNT': '0.320', 'WEAPON3': '0.350', 'weapon4': '0.354', 'DAMAGECOUNT': '1.032', 'weapon2': '1.264', 'weapon3': '1.370', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:01:03,796][63767] DAMAGECOUNT value on done: 13305.0 +[2023-09-14 15:01:03,797][63767] Sum rewards: -2.925, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.512', 'ARMOR': '0.008', 'weapon5': '0.010', 'AMMO5': '0.015', 'AMMO2': '0.024', 'WEAPON1': '0.050', 'AMMO3': '0.110', 'AMMO4': '0.120', 'HITCOUNT': '0.130', 'WEAPON4': '0.150', 'weapon4': '0.156', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.340', 'weapon3': '1.718'} +[2023-09-14 15:01:04,045][63770] DAMAGECOUNT value on done: 9810.0 +[2023-09-14 15:01:04,046][63770] Sum rewards: -3.169, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.566', 'AMMO2': '0.015', 'WEAPON1': '0.020', 'weapon5': '0.024', 'AMMO5': '0.028', 'AMMO4': '0.076', 'AMMO3': '0.133', 'HITCOUNT': '0.330', 'WEAPON5': '0.500', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.065', 'weapon2': '1.216', 'FRAGCOUNT': '2.000', 'weapon3': '2.340'} +[2023-09-14 15:01:04,201][63767] DAMAGECOUNT value on done: 12938.0 +[2023-09-14 15:01:04,203][63767] Sum rewards: -2.353, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.580', 'AMMO2': '0.002', 'weapon5': '0.006', 'AMMO5': '0.007', 'AMMO4': '0.008', 'WEAPON1': '0.020', 'HITCOUNT': '0.070', 'ARMOR': '0.080', 'WEAPON5': '0.150', 'AMMO3': '0.162', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.700', 'weapon2': '1.642', 'weapon3': '1.990', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:01:05,559][63734] DAMAGECOUNT value on done: 13146.0 +[2023-09-14 15:01:05,559][63734] Sum rewards: -2.853, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.016', 'AMMO4': '-0.002', 'AMMO2': '-0.000', 'AMMO5': '0.005', 'WEAPON5': '0.100', 'ARMOR': '0.132', 'HITCOUNT': '0.190', 'AMMO3': '0.192', 'WEAPON4': '0.200', 'weapon4': '0.374', 'DAMAGECOUNT': '0.678', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.284', 'weapon3': '1.510'} +[2023-09-14 15:01:05,973][63734] DAMAGECOUNT value on done: 10983.0 +[2023-09-14 15:01:05,974][63734] Sum rewards: -2.384, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.777', 'AMMO2': '0.005', 'AMMO5': '0.007', 'AMMO4': '0.024', 'weapon5': '0.034', 'weapon7': '0.048', 'ARMOR': '0.052', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.137', 'WEAPON5': '0.150', 'HITCOUNT': '0.320', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.101', 'weapon2': '1.282', 'weapon3': '2.132'} +[2023-09-14 15:01:07,182][63733] Updated weights for policy 1, policy_version 2000 (0.0012) +[2023-09-14 15:01:07,345][63805] DAMAGECOUNT value on done: 12780.0 +[2023-09-14 15:01:07,345][63805] Sum rewards: -2.050, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.226', 'AMMO4': '-0.017', 'AMMO2': '-0.003', 'AMMO5': '0.007', 'weapon5': '0.010', 'WEAPON1': '0.030', 'weapon7': '0.070', 'AMMO3': '0.101', 'HITCOUNT': '0.110', 'WEAPON5': '0.150', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON7': '0.200', 'ARMOR': '0.440', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.466', 'weapon2': '1.732'} +[2023-09-14 15:01:07,467][63576] Saving new best policy, reward=-2.616! +[2023-09-14 15:01:07,646][63734] DAMAGECOUNT value on done: 11501.0 +[2023-09-14 15:01:07,647][63734] Sum rewards: 1.367, reward structure: {'DEATHCOUNT': '-5.250', 'weapon5': '0.002', 'AMMO5': '0.003', 'AMMO2': '0.006', 'AMMO4': '0.032', 'WEAPON5': '0.050', 'HEALTH': '0.078', 'AMMO3': '0.109', 'HITCOUNT': '0.140', 'ARMOR': '0.440', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.555', 'FRAGCOUNT': '1.000', 'weapon3': '1.524', 'weapon2': '2.228'} +[2023-09-14 15:01:07,771][63805] DAMAGECOUNT value on done: 10531.0 +[2023-09-14 15:01:07,771][63805] Sum rewards: -3.020, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.656', 'AMMO5': '0.009', 'AMMO2': '0.010', 'WEAPON1': '0.030', 'ARMOR': '0.032', 'AMMO4': '0.051', 'weapon5': '0.052', 'weapon4': '0.066', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'AMMO3': '0.124', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.432', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.654', 'weapon2': '1.686'} +[2023-09-14 15:01:08,033][63734] DAMAGECOUNT value on done: 11872.0 +[2023-09-14 15:01:08,034][63734] Sum rewards: -1.417, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.830', 'AMMO2': '0.006', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'weapon5': '0.028', 'AMMO4': '0.028', 'AMMO3': '0.153', 'WEAPON5': '0.250', 'HITCOUNT': '0.300', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.933', 'weapon3': '1.810', 'weapon2': '1.822', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:01:08,174][63769] DAMAGECOUNT value on done: 12611.0 +[2023-09-14 15:01:08,175][63769] Sum rewards: 2.441, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.444', 'AMMO4': '-0.030', 'AMMO2': '-0.006', 'ARMOR': '0.008', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'weapon7': '0.050', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.153', 'weapon5': '0.190', 'WEAPON7': '0.200', 'WEAPON5': '0.300', 'HITCOUNT': '0.340', 'WEAPON3': '0.650', 'weapon2': '1.130', 'DAMAGECOUNT': '2.004', 'weapon3': '2.134', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:01:08,588][63769] DAMAGECOUNT value on done: 8856.0 +[2023-09-14 15:01:08,588][63769] Sum rewards: -2.510, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.648', 'AMMO2': '0.003', 'AMMO5': '0.012', 'AMMO4': '0.017', 'WEAPON1': '0.040', 'HITCOUNT': '0.050', 'AMMO3': '0.135', 'weapon5': '0.228', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.378', 'ARMOR': '0.440', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.022', 'weapon3': '1.362'} +[2023-09-14 15:01:11,152][63732] Updated weights for policy 0, policy_version 2030 (0.0012) +[2023-09-14 15:01:12,355][63733] Updated weights for policy 1, policy_version 2010 (0.0011) +[2023-09-14 15:01:12,452][63769] DAMAGECOUNT value on done: 12030.0 +[2023-09-14 15:01:12,452][63769] Sum rewards: -3.545, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.082', 'AMMO4': '-0.017', 'AMMO2': '-0.003', 'weapon5': '0.006', 'AMMO5': '0.018', 'WEAPON1': '0.030', 'ARMOR': '0.084', 'AMMO3': '0.155', 'HITCOUNT': '0.190', 'WEAPON5': '0.350', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.915', 'weapon2': '1.468', 'weapon3': '1.942', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:01:12,462][63576] Saving new best policy, reward=-2.529! +[2023-09-14 15:01:12,839][63769] DAMAGECOUNT value on done: 11356.0 +[2023-09-14 15:01:12,840][63769] Sum rewards: -2.750, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.375', 'weapon5': '0.002', 'AMMO2': '0.014', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'AMMO4': '0.069', 'AMMO3': '0.161', 'HITCOUNT': '0.170', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.555', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.412', 'weapon3': '2.254'} +[2023-09-14 15:01:13,283][63767] DAMAGECOUNT value on done: 13957.0 +[2023-09-14 15:01:13,284][63767] Sum rewards: -5.421, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.334', 'AMMO2': '0.003', 'AMMO4': '0.014', 'AMMO5': '0.017', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'weapon5': '0.050', 'AMMO3': '0.110', 'HITCOUNT': '0.180', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.648', 'WEAPON3': '0.700', 'weapon3': '1.512', 'weapon2': '1.898', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:01:13,655][63767] DAMAGECOUNT value on done: 16302.0 +[2023-09-14 15:01:13,656][63767] Sum rewards: -1.413, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.442', 'AMMO2': '0.011', 'AMMO5': '0.012', 'weapon5': '0.042', 'WEAPON1': '0.050', 'AMMO4': '0.057', 'ARMOR': '0.072', 'AMMO3': '0.088', 'WEAPON4': '0.100', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.837', 'FRAGCOUNT': '1.000', 'weapon2': '1.586', 'weapon3': '1.754'} +[2023-09-14 15:01:14,289][63771] DAMAGECOUNT value on done: 11149.0 +[2023-09-14 15:01:14,290][63771] Sum rewards: -5.854, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-3.044', 'AMMO4': '-0.022', 'AMMO2': '-0.004', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'weapon5': '0.074', 'ARMOR': '0.076', 'WEAPON5': '0.100', 'AMMO3': '0.172', 'HITCOUNT': '0.280', 'DAMAGECOUNT': '1.023', 'WEAPON3': '1.150', 'weapon2': '1.598', 'weapon3': '1.968', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:01:14,692][63771] DAMAGECOUNT value on done: 13951.0 +[2023-09-14 15:01:14,692][63771] Sum rewards: -2.149, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.260', 'ARMOR': '0.008', 'WEAPON1': '0.010', 'AMMO2': '0.022', 'HITCOUNT': '0.090', 'AMMO3': '0.105', 'AMMO4': '0.111', 'weapon4': '0.178', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.288', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.596', 'weapon2': '1.752'} +[2023-09-14 15:01:15,346][63770] DAMAGECOUNT value on done: 10556.0 +[2023-09-14 15:01:15,347][63770] Sum rewards: 0.413, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.764', 'AMMO2': '0.010', 'weapon5': '0.016', 'AMMO5': '0.020', 'WEAPON1': '0.030', 'AMMO4': '0.049', 'ARMOR': '0.080', 'HITCOUNT': '0.080', 'WEAPON4': '0.100', 'AMMO3': '0.102', 'weapon4': '0.192', 'DAMAGECOUNT': '0.390', 'WEAPON5': '0.400', 'WEAPON3': '0.600', 'weapon3': '1.282', 'weapon2': '1.826', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:01:15,754][63770] DAMAGECOUNT value on done: 12782.0 +[2023-09-14 15:01:15,755][63770] Sum rewards: -5.528, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.600', 'AMMO5': '0.010', 'AMMO2': '0.013', 'ARMOR': '0.045', 'AMMO4': '0.065', 'weapon5': '0.068', 'WEAPON1': '0.070', 'AMMO3': '0.151', 'WEAPON5': '0.250', 'HITCOUNT': '0.370', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050', 'DAMAGECOUNT': '1.050', 'weapon2': '1.254', 'weapon3': '2.176'} +[2023-09-14 15:01:17,688][63733] Updated weights for policy 1, policy_version 2020 (0.0011) +[2023-09-14 15:01:19,599][63805] DAMAGECOUNT value on done: 13887.0 +[2023-09-14 15:01:19,599][63805] Sum rewards: -2.039, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.312', 'AMMO2': '0.008', 'AMMO5': '0.013', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'AMMO4': '0.042', 'WEAPON4': '0.050', 'AMMO3': '0.110', 'weapon4': '0.148', 'WEAPON5': '0.150', 'HITCOUNT': '0.270', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.840', 'FRAGCOUNT': '1.000', 'weapon3': '1.502', 'weapon2': '1.788'} +[2023-09-14 15:01:20,007][63805] DAMAGECOUNT value on done: 14683.0 +[2023-09-14 15:01:21,325][63806] DAMAGECOUNT value on done: 11639.0 +[2023-09-14 15:01:21,326][63806] Sum rewards: -2.268, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.994', 'AMMO2': '0.000', 'AMMO4': '0.002', 'AMMO5': '0.010', 'ARMOR': '0.028', 'WEAPON1': '0.040', 'weapon5': '0.056', 'AMMO3': '0.093', 'WEAPON5': '0.200', 'HITCOUNT': '0.290', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.023', 'weapon3': '1.520', 'FRAGCOUNT': '2.000', 'weapon2': '2.014'} +[2023-09-14 15:01:21,724][63806] DAMAGECOUNT value on done: 11314.0 +[2023-09-14 15:01:21,786][63806] DAMAGECOUNT value on done: 11767.0 +[2023-09-14 15:01:21,786][63806] Sum rewards: -6.161, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.770', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.031', 'AMMO2': '-0.006', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'ARMOR': '0.080', 'weapon5': '0.130', 'AMMO3': '0.178', 'WEAPON5': '0.300', 'HITCOUNT': '0.310', 'WEAPON3': '1.100', 'DAMAGECOUNT': '1.122', 'weapon2': '1.360', 'weapon3': '2.040'} +[2023-09-14 15:01:22,138][63806] DAMAGECOUNT value on done: 11732.0 +[2023-09-14 15:01:22,865][63732] Updated weights for policy 0, policy_version 2040 (0.0011) +[2023-09-14 15:01:22,998][63733] Updated weights for policy 1, policy_version 2030 (0.0011) +[2023-09-14 15:01:23,823][63735] DAMAGECOUNT value on done: 10868.0 +[2023-09-14 15:01:24,236][63735] DAMAGECOUNT value on done: 13077.0 +[2023-09-14 15:01:24,236][63735] Sum rewards: -8.533, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-3.120', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'AMMO5': '0.007', 'WEAPON5': '0.150', 'AMMO3': '0.234', 'HITCOUNT': '0.310', 'DAMAGECOUNT': '1.080', 'WEAPON3': '1.400', 'weapon2': '1.614', 'FRAGCOUNT': '2.000', 'weapon3': '2.054'} +[2023-09-14 15:01:24,252][63735] DAMAGECOUNT value on done: 14343.0 +[2023-09-14 15:01:24,253][63735] Sum rewards: -0.662, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.610', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'weapon5': '0.028', 'AMMO3': '0.139', 'WEAPON5': '0.150', 'HITCOUNT': '0.200', 'ARMOR': '0.489', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.080', 'weapon2': '1.252', 'weapon3': '1.950', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:01:24,311][63771] DAMAGECOUNT value on done: 12011.0 +[2023-09-14 15:01:24,312][63771] Sum rewards: -2.216, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.934', 'AMMO5': '0.005', 'AMMO2': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.059', 'WEAPON5': '0.100', 'weapon4': '0.130', 'WEAPON4': '0.150', 'AMMO3': '0.153', 'HITCOUNT': '0.170', 'ARMOR': '0.574', 'DAMAGECOUNT': '0.627', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.332', 'weapon3': '1.686'} +[2023-09-14 15:01:24,665][63735] DAMAGECOUNT value on done: 9487.0 +[2023-09-14 15:01:24,666][63735] Sum rewards: -5.564, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.910', 'AMMO2': '0.014', 'WEAPON1': '0.040', 'AMMO4': '0.071', 'HITCOUNT': '0.130', 'AMMO3': '0.191', 'DAMAGECOUNT': '0.570', 'WEAPON3': '1.000', 'weapon2': '1.510', 'weapon3': '2.070', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:01:24,724][63771] DAMAGECOUNT value on done: 9778.0 +[2023-09-14 15:01:24,724][63771] Sum rewards: 2.295, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO5': '0.003', 'weapon5': '0.016', 'WEAPON1': '0.020', 'AMMO2': '0.025', 'WEAPON5': '0.050', 'ARMOR': '0.076', 'HEALTH': '0.088', 'AMMO3': '0.098', 'AMMO4': '0.125', 'weapon4': '0.144', 'WEAPON4': '0.150', 'HITCOUNT': '0.310', 'WEAPON3': '0.550', 'DAMAGECOUNT': '1.050', 'weapon3': '1.558', 'weapon2': '1.782', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:01:27,881][63767] DAMAGECOUNT value on done: 13698.0 +[2023-09-14 15:01:27,881][63767] Sum rewards: 0.510, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.060', 'weapon4': '0.002', 'AMMO5': '0.007', 'AMMO2': '0.012', 'weapon5': '0.026', 'WEAPON1': '0.030', 'AMMO4': '0.062', 'ARMOR': '0.068', 'WEAPON4': '0.100', 'AMMO3': '0.111', 'WEAPON5': '0.150', 'HITCOUNT': '0.250', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.179', 'weapon2': '1.598', 'weapon3': '1.824', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:01:27,886][63734] DAMAGECOUNT value on done: 13455.0 +[2023-09-14 15:01:27,886][63734] Sum rewards: -2.012, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.116', 'AMMO5': '0.003', 'AMMO2': '0.007', 'WEAPON1': '0.010', 'weapon5': '0.034', 'AMMO4': '0.035', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO3': '0.126', 'ARMOR': '0.128', 'weapon4': '0.212', 'HITCOUNT': '0.260', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.927', 'FRAGCOUNT': '1.000', 'weapon2': '1.220', 'weapon3': '1.692'} +[2023-09-14 15:01:28,206][63767] DAMAGECOUNT value on done: 13088.0 +[2023-09-14 15:01:28,241][63734] DAMAGECOUNT value on done: 11358.0 +[2023-09-14 15:01:28,242][63734] Sum rewards: -5.473, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.965', 'FRAGCOUNT': '-0.500', 'ARMOR': '0.008', 'WEAPON1': '0.010', 'AMMO2': '0.014', 'AMMO5': '0.020', 'weapon5': '0.026', 'AMMO4': '0.071', 'WEAPON4': '0.150', 'AMMO3': '0.156', 'weapon4': '0.252', 'HITCOUNT': '0.280', 'WEAPON5': '0.400', 'WEAPON3': '0.900', 'weapon2': '0.986', 'DAMAGECOUNT': '1.125', 'weapon3': '2.094'} +[2023-09-14 15:01:28,337][63733] Updated weights for policy 1, policy_version 2040 (0.0012) +[2023-09-14 15:01:29,164][63770] DAMAGECOUNT value on done: 14253.0 +[2023-09-14 15:01:29,164][63770] Sum rewards: -2.478, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.750', 'AMMO2': '0.004', 'AMMO5': '0.017', 'AMMO4': '0.019', 'weapon5': '0.030', 'weapon7': '0.096', 'AMMO3': '0.124', 'HITCOUNT': '0.210', 'AMMO6': '0.220', 'AMMO7': '0.220', 'WEAPON5': '0.250', 'WEAPON7': '0.300', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.789', 'WEAPON3': '0.850', 'weapon2': '1.160', 'weapon3': '1.984'} +[2023-09-14 15:01:29,537][63770] DAMAGECOUNT value on done: 10073.0 +[2023-09-14 15:01:29,537][63770] Sum rewards: 1.190, reward structure: {'DEATHCOUNT': '-5.250', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.010', 'weapon4': '0.012', 'weapon5': '0.024', 'ARMOR': '0.039', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO4': '0.050', 'AMMO3': '0.070', 'HITCOUNT': '0.180', 'WEAPON3': '0.350', 'HEALTH': '0.432', 'DAMAGECOUNT': '0.789', 'FRAGCOUNT': '1.000', 'weapon3': '1.456', 'weapon2': '1.912'} +[2023-09-14 15:01:30,066][63805] Large shaping reward 2.640 for [('FRAGCOUNT', 2.0, 2.0), ('HITCOUNT', 0.04, 4.0), ('DAMAGECOUNT', 0.6, 200)] +[2023-09-14 15:01:30,380][63769] DAMAGECOUNT value on done: 13153.0 +[2023-09-14 15:01:30,381][63769] Sum rewards: 2.567, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO5': '0.005', 'AMMO2': '0.007', 'WEAPON1': '0.010', 'ARMOR': '0.024', 'AMMO4': '0.036', 'weapon5': '0.036', 'HEALTH': '0.037', 'WEAPON5': '0.050', 'AMMO3': '0.106', 'HITCOUNT': '0.370', 'WEAPON3': '0.650', 'weapon2': '1.156', 'DAMAGECOUNT': '1.626', 'weapon3': '1.954', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:01:30,735][63769] DAMAGECOUNT value on done: 9251.0 +[2023-09-14 15:01:30,736][63769] Sum rewards: 2.460, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.356', 'AMMO5': '0.017', 'AMMO2': '0.018', 'WEAPON1': '0.070', 'ARMOR': '0.076', 'AMMO4': '0.090', 'WEAPON4': '0.100', 'weapon4': '0.136', 'AMMO3': '0.150', 'weapon5': '0.204', 'HITCOUNT': '0.280', 'WEAPON5': '0.350', 'weapon2': '0.732', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.185', 'weapon3': '2.158', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:01:31,160][63805] DAMAGECOUNT value on done: 13025.0 +[2023-09-14 15:01:31,161][63805] Sum rewards: 1.400, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.766', 'WEAPON1': '0.010', 'AMMO2': '0.010', 'AMMO5': '0.013', 'weapon4': '0.022', 'WEAPON4': '0.050', 'AMMO4': '0.051', 'weapon5': '0.062', 'AMMO3': '0.085', 'WEAPON5': '0.150', 'HITCOUNT': '0.180', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.735', 'weapon2': '1.608', 'weapon3': '1.890', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:01:31,553][63805] DAMAGECOUNT value on done: 10671.0 +[2023-09-14 15:01:31,553][63805] Sum rewards: -3.491, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.960', 'AMMO5': '0.009', 'weapon4': '0.012', 'WEAPON1': '0.020', 'AMMO2': '0.025', 'ARMOR': '0.040', 'HITCOUNT': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'AMMO4': '0.125', 'weapon5': '0.126', 'AMMO3': '0.127', 'DAMAGECOUNT': '0.420', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.800', 'weapon3': '1.582', 'weapon2': '1.632'} +[2023-09-14 15:01:31,797][63734] DAMAGECOUNT value on done: 11867.0 +[2023-09-14 15:01:31,797][63734] Sum rewards: -0.730, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.075', 'AMMO2': '0.009', 'AMMO4': '0.042', 'WEAPON4': '0.050', 'ARMOR': '0.064', 'AMMO3': '0.088', 'weapon4': '0.248', 'HITCOUNT': '0.260', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.098', 'weapon3': '1.586', 'FRAGCOUNT': '2.000', 'weapon2': '2.000'} +[2023-09-14 15:01:32,198][63734] DAMAGECOUNT value on done: 11947.0 +[2023-09-14 15:01:32,461][63576] Saving new best policy, reward=-2.526! +[2023-09-14 15:01:33,671][63733] Updated weights for policy 1, policy_version 2050 (0.0010) +[2023-09-14 15:01:34,600][63732] Updated weights for policy 0, policy_version 2050 (0.0011) +[2023-09-14 15:01:37,091][63767] DAMAGECOUNT value on done: 14112.0 +[2023-09-14 15:01:37,467][63576] Saving new best policy, reward=-2.489! +[2023-09-14 15:01:37,475][63767] DAMAGECOUNT value on done: 16482.0 +[2023-09-14 15:01:37,475][63767] Sum rewards: -7.726, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.978', 'AMMO2': '0.008', 'WEAPON1': '0.040', 'AMMO4': '0.040', 'AMMO3': '0.143', 'HITCOUNT': '0.180', 'ARMOR': '0.484', 'DAMAGECOUNT': '0.540', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon3': '1.674', 'weapon2': '1.942'} +[2023-09-14 15:01:37,571][63769] DAMAGECOUNT value on done: 12388.0 +[2023-09-14 15:01:37,571][63769] Sum rewards: -1.564, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.434', 'AMMO2': '0.004', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.021', 'weapon5': '0.088', 'AMMO3': '0.138', 'HITCOUNT': '0.200', 'WEAPON5': '0.300', 'ARMOR': '0.420', 'WEAPON3': '0.850', 'weapon2': '1.004', 'DAMAGECOUNT': '1.074', 'weapon3': '1.986', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:01:37,959][63769] DAMAGECOUNT value on done: 11396.0 +[2023-09-14 15:01:37,959][63769] Sum rewards: -0.305, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.222', 'weapon5': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.011', 'WEAPON1': '0.040', 'HITCOUNT': '0.050', 'AMMO4': '0.056', 'ARMOR': '0.080', 'AMMO3': '0.097', 'DAMAGECOUNT': '0.120', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'weapon4': '0.400', 'WEAPON3': '0.650', 'weapon3': '1.328', 'weapon2': '1.716', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:01:38,144][63771] DAMAGECOUNT value on done: 11184.0 +[2023-09-14 15:01:38,522][63771] DAMAGECOUNT value on done: 14066.0 +[2023-09-14 15:01:39,000][63733] Updated weights for policy 1, policy_version 2060 (0.0012) +[2023-09-14 15:01:40,722][63770] DAMAGECOUNT value on done: 10659.0 +[2023-09-14 15:01:41,131][63770] DAMAGECOUNT value on done: 12964.0 +[2023-09-14 15:01:43,381][63805] DAMAGECOUNT value on done: 14167.0 +[2023-09-14 15:01:43,382][63805] Sum rewards: -0.393, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.843', 'AMMO5': '0.010', 'AMMO2': '0.011', 'WEAPON1': '0.050', 'AMMO4': '0.054', 'weapon5': '0.078', 'ARMOR': '0.080', 'AMMO3': '0.087', 'WEAPON4': '0.150', 'HITCOUNT': '0.160', 'weapon4': '0.168', 'WEAPON5': '0.200', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.840', 'weapon2': '1.266', 'weapon3': '1.946', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:01:43,760][63805] DAMAGECOUNT value on done: 15173.0 +[2023-09-14 15:01:43,761][63805] Sum rewards: 2.963, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.270', 'AMMO4': '-0.041', 'AMMO2': '-0.008', 'weapon5': '0.004', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'AMMO3': '0.061', 'ARMOR': '0.073', 'weapon7': '0.080', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.210', 'WEAPON3': '0.450', 'DAMAGECOUNT': '1.302', 'weapon3': '1.456', 'weapon2': '1.976', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:01:44,164][63733] Updated weights for policy 1, policy_version 2070 (0.0010) +[2023-09-14 15:01:45,294][63806] DAMAGECOUNT value on done: 11694.0 +[2023-09-14 15:01:45,295][63806] Sum rewards: 2.125, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.560', 'weapon5': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.024', 'WEAPON1': '0.030', 'ARMOR': '0.040', 'AMMO3': '0.098', 'weapon4': '0.100', 'AMMO4': '0.119', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'HITCOUNT': '0.360', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.140', 'weapon3': '1.648', 'weapon2': '1.658', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:01:45,681][63806] DAMAGECOUNT value on done: 11992.0 +[2023-09-14 15:01:45,681][63806] Sum rewards: 1.262, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.005', 'AMMO2': '0.012', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'AMMO4': '0.059', 'AMMO3': '0.060', 'weapon4': '0.062', 'WEAPON5': '0.100', 'weapon5': '0.136', 'HEALTH': '0.178', 'HITCOUNT': '0.180', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.780', 'weapon3': '1.416', 'weapon2': '1.794', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:01:46,062][63806] DAMAGECOUNT value on done: 11819.0 +[2023-09-14 15:01:46,062][63806] Sum rewards: -0.717, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.480', 'AMMO4': '-0.008', 'AMMO2': '-0.002', 'AMMO5': '0.009', 'weapon5': '0.030', 'WEAPON1': '0.040', 'ARMOR': '0.045', 'AMMO3': '0.093', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.540', 'FRAGCOUNT': '1.000', 'weapon3': '1.274', 'weapon2': '1.940'} +[2023-09-14 15:01:46,420][63806] DAMAGECOUNT value on done: 12025.0 +[2023-09-14 15:01:46,421][63806] Sum rewards: -5.894, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.972', 'AMMO2': '0.002', 'AMMO4': '0.009', 'AMMO5': '0.015', 'weapon5': '0.034', 'ARMOR': '0.052', 'AMMO3': '0.187', 'HITCOUNT': '0.200', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.729', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.306', 'weapon3': '2.244'} +[2023-09-14 15:01:46,572][63732] Updated weights for policy 0, policy_version 2060 (0.0011) +[2023-09-14 15:01:47,467][63576] Saving new best policy, reward=-2.279! +[2023-09-14 15:01:47,564][63735] DAMAGECOUNT value on done: 13283.0 +[2023-09-14 15:01:47,565][63735] Sum rewards: 0.871, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.187', 'WEAPON1': '0.010', 'AMMO2': '0.036', 'AMMO3': '0.097', 'ARMOR': '0.108', 'HITCOUNT': '0.180', 'AMMO4': '0.181', 'WEAPON4': '0.300', 'WEAPON3': '0.300', 'weapon4': '0.318', 'DAMAGECOUNT': '0.618', 'weapon3': '1.004', 'weapon2': '1.906', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:01:47,952][63735] DAMAGECOUNT value on done: 9542.0 +[2023-09-14 15:01:47,952][63735] Sum rewards: -2.648, reward structure: {'DEATHCOUNT': '-5.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.430', 'AMMO5': '0.010', 'AMMO2': '0.017', 'WEAPON1': '0.040', 'HITCOUNT': '0.050', 'AMMO3': '0.060', 'ARMOR': '0.066', 'AMMO4': '0.082', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.165', 'weapon5': '0.190', 'WEAPON5': '0.200', 'weapon4': '0.362', 'WEAPON3': '0.450', 'weapon2': '1.320', 'weapon3': '1.370'} +[2023-09-14 15:01:48,551][63735] DAMAGECOUNT value on done: 10928.0 +[2023-09-14 15:01:48,927][63735] DAMAGECOUNT value on done: 14881.0 +[2023-09-14 15:01:48,927][63735] Sum rewards: -0.944, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.074', 'AMMO4': '-0.017', 'AMMO2': '-0.003', 'WEAPON1': '0.010', 'AMMO5': '0.010', 'ARMOR': '0.036', 'weapon7': '0.080', 'weapon5': '0.096', 'WEAPON4': '0.100', 'weapon4': '0.104', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.144', 'WEAPON7': '0.200', 'WEAPON5': '0.250', 'HITCOUNT': '0.400', 'WEAPON3': '0.900', 'weapon2': '0.928', 'DAMAGECOUNT': '1.614', 'FRAGCOUNT': '2.000', 'weapon3': '2.038'} +[2023-09-14 15:01:49,271][63733] Updated weights for policy 1, policy_version 2080 (0.0013) +[2023-09-14 15:01:49,399][63771] DAMAGECOUNT value on done: 12246.0 +[2023-09-14 15:01:49,399][63771] Sum rewards: -6.233, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.282', 'AMMO4': '-0.021', 'AMMO2': '-0.004', 'AMMO5': '0.010', 'ARMOR': '0.068', 'weapon5': '0.114', 'WEAPON5': '0.200', 'HITCOUNT': '0.210', 'AMMO3': '0.214', 'DAMAGECOUNT': '0.705', 'WEAPON3': '1.000', 'weapon2': '1.754', 'weapon3': '1.798', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:01:49,789][63771] DAMAGECOUNT value on done: 9882.0 +[2023-09-14 15:01:49,790][63771] Sum rewards: -7.464, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.582', 'AMMO4': '-0.016', 'AMMO2': '-0.003', 'weapon5': '0.004', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'ARMOR': '0.064', 'HITCOUNT': '0.100', 'AMMO3': '0.111', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.312', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.670', 'weapon2': '1.996'} +[2023-09-14 15:01:49,863][63734] DAMAGECOUNT value on done: 13828.0 +[2023-09-14 15:01:49,863][63734] Sum rewards: -1.524, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.098', 'AMMO2': '0.003', 'AMMO5': '0.014', 'AMMO4': '0.015', 'WEAPON1': '0.040', 'WEAPON4': '0.100', 'AMMO3': '0.110', 'HITCOUNT': '0.160', 'weapon5': '0.168', 'weapon4': '0.240', 'WEAPON5': '0.300', 'ARMOR': '0.468', 'WEAPON3': '0.700', 'weapon2': '1.094', 'DAMAGECOUNT': '1.119', 'weapon3': '1.542', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:01:50,195][63734] DAMAGECOUNT value on done: 11563.0 +[2023-09-14 15:01:50,196][63734] Sum rewards: -0.892, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.432', 'AMMO5': '0.003', 'weapon5': '0.006', 'ARMOR': '0.012', 'AMMO2': '0.013', 'WEAPON1': '0.040', 'weapon4': '0.044', 'WEAPON5': '0.050', 'AMMO4': '0.065', 'WEAPON4': '0.100', 'AMMO3': '0.156', 'HITCOUNT': '0.200', 'DAMAGECOUNT': '0.615', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.340', 'weapon3': '1.896'} +[2023-09-14 15:01:51,538][63767] DAMAGECOUNT value on done: 13883.0 +[2023-09-14 15:01:51,539][63767] Sum rewards: -0.890, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.528', 'AMMO2': '0.007', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO4': '0.034', 'WEAPON4': '0.050', 'ARMOR': '0.084', 'weapon5': '0.102', 'weapon4': '0.120', 'AMMO3': '0.122', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.555', 'WEAPON3': '0.850', 'weapon2': '1.380', 'weapon3': '1.996', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:01:51,928][63767] DAMAGECOUNT value on done: 13450.0 +[2023-09-14 15:01:51,928][63767] Sum rewards: -4.531, reward structure: {'DEATHCOUNT': '-9.750', 'FRAGCOUNT': '-0.500', 'HEALTH': '-0.212', 'AMMO2': '0.011', 'WEAPON1': '0.020', 'AMMO5': '0.020', 'AMMO4': '0.054', 'ARMOR': '0.057', 'weapon5': '0.086', 'weapon4': '0.094', 'WEAPON4': '0.100', 'AMMO3': '0.125', 'HITCOUNT': '0.200', 'WEAPON5': '0.350', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.086', 'weapon2': '1.426', 'weapon3': '1.652'} +[2023-09-14 15:01:52,569][63769] DAMAGECOUNT value on done: 13543.0 +[2023-09-14 15:01:52,569][63769] Sum rewards: 2.584, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.990', 'ARMOR': '0.016', 'AMMO2': '0.023', 'AMMO5': '0.024', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'AMMO4': '0.115', 'AMMO3': '0.130', 'weapon4': '0.212', 'weapon5': '0.218', 'HITCOUNT': '0.290', 'WEAPON5': '0.350', 'WEAPON3': '0.750', 'weapon2': '0.794', 'DAMAGECOUNT': '1.170', 'weapon3': '1.902', 'FRAGCOUNT': '5.000'} +[2023-09-14 15:01:52,923][63769] DAMAGECOUNT value on done: 9561.0 +[2023-09-14 15:01:52,924][63769] Sum rewards: -1.077, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.500', 'AMMO5': '0.007', 'AMMO2': '0.015', 'ARMOR': '0.020', 'weapon5': '0.034', 'WEAPON5': '0.050', 'AMMO4': '0.073', 'weapon7': '0.082', 'AMMO3': '0.120', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.250', 'weapon4': '0.368', 'weapon2': '0.726', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.930', 'FRAGCOUNT': '1.000', 'weapon3': '2.058'} +[2023-09-14 15:01:54,239][63733] Updated weights for policy 1, policy_version 2090 (0.0011) +[2023-09-14 15:01:54,473][63770] DAMAGECOUNT value on done: 14423.0 +[2023-09-14 15:01:54,881][63770] DAMAGECOUNT value on done: 10448.0 +[2023-09-14 15:01:54,881][63770] Sum rewards: -3.901, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.568', 'AMMO4': '-0.047', 'AMMO2': '-0.009', 'AMMO5': '0.008', 'ARMOR': '0.064', 'weapon5': '0.100', 'AMMO3': '0.172', 'WEAPON5': '0.200', 'HITCOUNT': '0.310', 'WEAPON3': '1.050', 'DAMAGECOUNT': '1.125', 'weapon2': '1.458', 'weapon3': '1.986', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:01:54,959][63805] DAMAGECOUNT value on done: 13349.0 +[2023-09-14 15:01:54,959][63805] Sum rewards: -2.177, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.460', 'AMMO2': '0.010', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'weapon5': '0.022', 'AMMO4': '0.047', 'weapon4': '0.074', 'ARMOR': '0.094', 'AMMO3': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'HITCOUNT': '0.240', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.972', 'weapon2': '1.568', 'weapon3': '1.924', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:01:55,338][63805] DAMAGECOUNT value on done: 10821.0 +[2023-09-14 15:01:55,339][63805] Sum rewards: -6.591, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-3.008', 'weapon5': '0.002', 'AMMO2': '0.006', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO4': '0.029', 'HITCOUNT': '0.100', 'WEAPON5': '0.150', 'AMMO3': '0.171', 'ARMOR': '0.448', 'DAMAGECOUNT': '0.450', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.200', 'weapon2': '1.270', 'weapon3': '2.064'} +[2023-09-14 15:01:55,483][63734] DAMAGECOUNT value on done: 12027.0 +[2023-09-14 15:01:55,874][63734] DAMAGECOUNT value on done: 12248.0 +[2023-09-14 15:01:55,875][63734] Sum rewards: -1.135, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.046', 'AMMO2': '0.007', 'AMMO5': '0.010', 'AMMO4': '0.034', 'WEAPON1': '0.080', 'AMMO3': '0.091', 'weapon5': '0.148', 'HITCOUNT': '0.190', 'WEAPON5': '0.300', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.903', 'weapon3': '1.592', 'weapon2': '1.606', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:01:59,300][63732] Updated weights for policy 0, policy_version 2070 (0.0011) +[2023-09-14 15:01:59,474][63733] Updated weights for policy 1, policy_version 2100 (0.0013) +[2023-09-14 15:02:00,691][63767] DAMAGECOUNT value on done: 14497.0 +[2023-09-14 15:02:00,691][63767] Sum rewards: 2.867, reward structure: {'DEATHCOUNT': '-5.250', 'weapon4': '0.008', 'AMMO5': '0.017', 'AMMO2': '0.022', 'ARMOR': '0.036', 'WEAPON1': '0.060', 'AMMO3': '0.071', 'WEAPON4': '0.100', 'AMMO4': '0.109', 'HEALTH': '0.160', 'HITCOUNT': '0.190', 'weapon5': '0.206', 'WEAPON5': '0.350', 'WEAPON3': '0.450', 'DAMAGECOUNT': '1.155', 'weapon3': '1.586', 'weapon2': '1.596', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:01,124][63767] DAMAGECOUNT value on done: 16817.0 +[2023-09-14 15:02:01,125][63767] Sum rewards: -3.633, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.616', 'weapon5': '0.002', 'AMMO2': '0.007', 'WEAPON1': '0.010', 'AMMO5': '0.013', 'AMMO4': '0.037', 'ARMOR': '0.040', 'WEAPON5': '0.150', 'AMMO3': '0.181', 'HITCOUNT': '0.220', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.005', 'weapon2': '1.300', 'weapon3': '2.118', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:02:02,337][63771] DAMAGECOUNT value on done: 11423.0 +[2023-09-14 15:02:02,337][63771] Sum rewards: -1.119, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.527', 'AMMO5': '0.005', 'AMMO2': '0.022', 'weapon5': '0.060', 'WEAPON5': '0.100', 'ARMOR': '0.109', 'AMMO4': '0.109', 'AMMO3': '0.120', 'HITCOUNT': '0.160', 'WEAPON4': '0.300', 'weapon4': '0.344', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.717', 'weapon2': '1.564', 'weapon3': '1.698', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:02,735][63771] DAMAGECOUNT value on done: 14140.0 +[2023-09-14 15:02:02,807][63769] DAMAGECOUNT value on done: 12690.0 +[2023-09-14 15:02:02,807][63769] Sum rewards: -2.725, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.896', 'AMMO2': '0.007', 'weapon5': '0.014', 'AMMO5': '0.015', 'AMMO4': '0.035', 'WEAPON1': '0.040', 'weapon7': '0.068', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.155', 'WEAPON7': '0.200', 'HITCOUNT': '0.240', 'WEAPON5': '0.300', 'ARMOR': '0.461', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.906', 'weapon2': '1.110', 'FRAGCOUNT': '2.000', 'weapon3': '2.230'} +[2023-09-14 15:02:03,132][63769] DAMAGECOUNT value on done: 11515.0 +[2023-09-14 15:02:04,672][63733] Updated weights for policy 1, policy_version 2110 (0.0012) +[2023-09-14 15:02:05,073][63770] DAMAGECOUNT value on done: 10884.0 +[2023-09-14 15:02:05,073][63770] Sum rewards: -1.707, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.593', 'AMMO5': '0.005', 'weapon4': '0.006', 'AMMO2': '0.023', 'ARMOR': '0.024', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'WEAPON5': '0.100', 'AMMO4': '0.113', 'AMMO3': '0.142', 'HITCOUNT': '0.180', 'weapon5': '0.198', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.900', 'weapon2': '1.244', 'FRAGCOUNT': '2.000', 'weapon3': '2.196'} +[2023-09-14 15:02:05,473][63770] DAMAGECOUNT value on done: 13311.0 +[2023-09-14 15:02:05,473][63770] Sum rewards: -2.423, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.108', 'AMMO5': '0.010', 'AMMO2': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.061', 'ARMOR': '0.088', 'weapon4': '0.092', 'AMMO3': '0.124', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'HITCOUNT': '0.250', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.041', 'weapon2': '1.638', 'weapon3': '1.848', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:02:07,117][63805] DAMAGECOUNT value on done: 14272.0 +[2023-09-14 15:02:07,117][63805] Sum rewards: -2.396, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.426', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO2': '0.031', 'ARMOR': '0.068', 'HITCOUNT': '0.070', 'weapon5': '0.080', 'AMMO3': '0.121', 'WEAPON5': '0.150', 'AMMO4': '0.157', 'weapon4': '0.248', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.315', 'WEAPON3': '0.800', 'weapon2': '1.198', 'weapon3': '1.764', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:07,515][63805] DAMAGECOUNT value on done: 15368.0 +[2023-09-14 15:02:07,515][63805] Sum rewards: -5.361, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.946', 'AMMO5': '0.013', 'AMMO2': '0.014', 'WEAPON1': '0.030', 'AMMO4': '0.068', 'ARMOR': '0.072', 'weapon5': '0.124', 'AMMO3': '0.168', 'HITCOUNT': '0.210', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.585', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050', 'weapon2': '1.450', 'weapon3': '2.052'} +[2023-09-14 15:02:08,852][63806] DAMAGECOUNT value on done: 11829.0 +[2023-09-14 15:02:09,226][63806] DAMAGECOUNT value on done: 12332.0 +[2023-09-14 15:02:09,226][63806] Sum rewards: -2.422, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.216', 'AMMO5': '0.007', 'AMMO2': '0.022', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'weapon5': '0.054', 'weapon4': '0.076', 'AMMO4': '0.107', 'ARMOR': '0.112', 'AMMO3': '0.125', 'WEAPON5': '0.150', 'HITCOUNT': '0.360', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.020', 'weapon2': '1.590', 'weapon3': '1.840', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:09,728][63733] Updated weights for policy 1, policy_version 2120 (0.0011) +[2023-09-14 15:02:10,628][63806] DAMAGECOUNT value on done: 12061.0 +[2023-09-14 15:02:10,628][63806] Sum rewards: 3.656, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.034', 'AMMO5': '0.005', 'AMMO2': '0.007', 'weapon5': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.034', 'AMMO3': '0.094', 'WEAPON5': '0.100', 'ARMOR': '0.104', 'WEAPON4': '0.150', 'HITCOUNT': '0.170', 'weapon4': '0.488', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.726', 'weapon2': '1.528', 'weapon3': '1.552', 'FRAGCOUNT': '5.000'} +[2023-09-14 15:02:11,080][63806] DAMAGECOUNT value on done: 12120.0 +[2023-09-14 15:02:11,081][63806] Sum rewards: -4.288, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.735', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.008', 'AMMO5': '0.015', 'AMMO4': '0.037', 'ARMOR': '0.044', 'HITCOUNT': '0.110', 'weapon5': '0.116', 'AMMO3': '0.126', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.285', 'WEAPON3': '0.750', 'weapon2': '1.504', 'weapon3': '1.952'} +[2023-09-14 15:02:11,646][63735] DAMAGECOUNT value on done: 13318.0 +[2023-09-14 15:02:11,646][63735] Sum rewards: -3.993, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.670', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO2': '0.020', 'HITCOUNT': '0.030', 'weapon4': '0.044', 'AMMO4': '0.102', 'AMMO3': '0.102', 'DAMAGECOUNT': '0.105', 'ARMOR': '0.120', 'WEAPON5': '0.150', 'WEAPON4': '0.200', 'weapon5': '0.232', 'WEAPON3': '0.650', 'weapon2': '1.402', 'weapon3': '1.742'} +[2023-09-14 15:02:11,979][63734] DAMAGECOUNT value on done: 14054.0 +[2023-09-14 15:02:11,980][63734] Sum rewards: -0.584, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.804', 'AMMO2': '0.002', 'AMMO4': '0.012', 'AMMO5': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.035', 'weapon5': '0.046', 'AMMO3': '0.108', 'HITCOUNT': '0.200', 'WEAPON5': '0.300', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.678', 'weapon2': '1.458', 'weapon3': '1.546', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:12,004][63735] DAMAGECOUNT value on done: 9664.0 +[2023-09-14 15:02:12,005][63735] Sum rewards: -0.750, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.621', 'AMMO4': '-0.012', 'AMMO2': '-0.002', 'AMMO5': '0.003', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'AMMO3': '0.063', 'HITCOUNT': '0.110', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.366', 'FRAGCOUNT': '1.000', 'weapon3': '1.054', 'weapon2': '1.438'} +[2023-09-14 15:02:12,141][63732] Updated weights for policy 0, policy_version 2080 (0.0010) +[2023-09-14 15:02:12,356][63734] DAMAGECOUNT value on done: 11934.0 +[2023-09-14 15:02:12,356][63734] Sum rewards: -3.324, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.226', 'AMMO5': '0.010', 'AMMO2': '0.014', 'AMMO4': '0.071', 'ARMOR': '0.100', 'weapon5': '0.126', 'WEAPON4': '0.150', 'AMMO3': '0.163', 'HITCOUNT': '0.200', 'WEAPON5': '0.250', 'weapon4': '0.334', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.113', 'weapon2': '1.452', 'weapon3': '1.518', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:13,621][63735] DAMAGECOUNT value on done: 11189.0 +[2023-09-14 15:02:13,622][63735] Sum rewards: -4.657, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.806', 'AMMO5': '0.010', 'weapon5': '0.010', 'AMMO2': '0.016', 'WEAPON1': '0.020', 'ARMOR': '0.072', 'AMMO4': '0.079', 'AMMO3': '0.119', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'HITCOUNT': '0.230', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.783', 'FRAGCOUNT': '1.000', 'weapon3': '1.198', 'weapon2': '2.262'} +[2023-09-14 15:02:14,004][63735] DAMAGECOUNT value on done: 15136.0 +[2023-09-14 15:02:14,004][63735] Sum rewards: -1.960, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.660', 'AMMO4': '-0.043', 'AMMO2': '-0.009', 'WEAPON1': '0.020', 'AMMO5': '0.026', 'AMMO3': '0.131', 'weapon5': '0.170', 'HITCOUNT': '0.210', 'WEAPON5': '0.400', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.765', 'weapon3': '1.352', 'weapon2': '1.376', 'FRAGCOUNT': '1.500'} +[2023-09-14 15:02:14,519][63771] DAMAGECOUNT value on done: 12519.0 +[2023-09-14 15:02:14,520][63771] Sum rewards: -3.133, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.896', 'AMMO2': '0.008', 'AMMO5': '0.015', 'WEAPON1': '0.030', 'AMMO4': '0.041', 'ARMOR': '0.068', 'WEAPON4': '0.100', 'weapon4': '0.136', 'weapon5': '0.138', 'AMMO3': '0.208', 'HITCOUNT': '0.240', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.819', 'WEAPON3': '0.900', 'weapon2': '1.240', 'FRAGCOUNT': '2.000', 'weapon3': '2.020'} +[2023-09-14 15:02:14,631][63769] DAMAGECOUNT value on done: 14241.0 +[2023-09-14 15:02:14,632][63769] Sum rewards: -2.188, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.430', 'FRAGCOUNT': '0.000', 'weapon7': '0.004', 'AMMO2': '0.005', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.026', 'ARMOR': '0.040', 'WEAPON4': '0.100', 'AMMO3': '0.102', 'weapon4': '0.106', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon5': '0.252', 'HITCOUNT': '0.290', 'WEAPON5': '0.350', 'WEAPON3': '0.650', 'weapon2': '1.080', 'weapon3': '1.760', 'DAMAGECOUNT': '2.094'} +[2023-09-14 15:02:14,801][63733] Updated weights for policy 1, policy_version 2130 (0.0010) +[2023-09-14 15:02:14,976][63771] DAMAGECOUNT value on done: 10092.0 +[2023-09-14 15:02:14,976][63771] Sum rewards: -2.533, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.668', 'AMMO5': '0.023', 'AMMO2': '0.028', 'WEAPON1': '0.040', 'AMMO3': '0.064', 'AMMO4': '0.140', 'weapon4': '0.142', 'WEAPON4': '0.150', 'HITCOUNT': '0.190', 'weapon5': '0.264', 'WEAPON5': '0.350', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.630', 'FRAGCOUNT': '1.000', 'weapon3': '1.476', 'weapon2': '1.588'} +[2023-09-14 15:02:15,000][63769] DAMAGECOUNT value on done: 9723.0 +[2023-09-14 15:02:15,001][63769] Sum rewards: -3.400, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.980', 'AMMO2': '0.007', 'AMMO5': '0.017', 'WEAPON1': '0.030', 'AMMO4': '0.033', 'ARMOR': '0.040', 'HITCOUNT': '0.120', 'AMMO3': '0.139', 'weapon5': '0.290', 'WEAPON5': '0.450', 'DAMAGECOUNT': '0.486', 'WEAPON3': '0.900', 'weapon2': '1.118', 'weapon3': '1.950', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:15,109][63767] DAMAGECOUNT value on done: 14296.0 +[2023-09-14 15:02:15,110][63767] Sum rewards: -1.805, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.370', 'AMMO5': '0.005', 'AMMO2': '0.022', 'weapon7': '0.072', 'ARMOR': '0.096', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.108', 'AMMO3': '0.111', 'WEAPON4': '0.150', 'weapon4': '0.224', 'HITCOUNT': '0.320', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.239', 'weapon2': '1.582', 'weapon3': '1.686'} +[2023-09-14 15:02:15,496][63767] DAMAGECOUNT value on done: 13580.0 +[2023-09-14 15:02:18,579][63805] DAMAGECOUNT value on done: 13704.0 +[2023-09-14 15:02:18,580][63805] Sum rewards: 1.712, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.482', 'AMMO5': '0.005', 'AMMO2': '0.006', 'AMMO4': '0.029', 'weapon4': '0.060', 'AMMO3': '0.095', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'ARMOR': '0.104', 'HITCOUNT': '0.260', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.065', 'weapon3': '1.332', 'weapon2': '2.188', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:02:18,991][63805] DAMAGECOUNT value on done: 10995.0 +[2023-09-14 15:02:18,991][63805] Sum rewards: -1.159, reward structure: {'DEATHCOUNT': '-5.250', 'FRAGCOUNT': '-0.500', 'HEALTH': '-0.318', 'AMMO5': '0.006', 'AMMO2': '0.007', 'WEAPON1': '0.020', 'AMMO4': '0.034', 'WEAPON4': '0.050', 'ARMOR': '0.076', 'weapon4': '0.094', 'AMMO3': '0.098', 'weapon5': '0.148', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.522', 'WEAPON3': '0.600', 'weapon2': '1.314', 'weapon3': '1.620'} +[2023-09-14 15:02:19,563][63734] DAMAGECOUNT value on done: 12252.0 +[2023-09-14 15:02:19,683][63770] DAMAGECOUNT value on done: 14558.0 +[2023-09-14 15:02:19,684][63770] Sum rewards: -4.432, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.737', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.007', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO4': '0.036', 'ARMOR': '0.050', 'WEAPON4': '0.050', 'weapon5': '0.086', 'WEAPON5': '0.100', 'AMMO3': '0.121', 'HITCOUNT': '0.150', 'weapon4': '0.150', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.650', 'weapon3': '1.504', 'weapon2': '1.718'} +[2023-09-14 15:02:19,860][63733] Updated weights for policy 1, policy_version 2140 (0.0012) +[2023-09-14 15:02:19,943][63734] DAMAGECOUNT value on done: 12288.0 +[2023-09-14 15:02:20,103][63770] DAMAGECOUNT value on done: 10833.0 +[2023-09-14 15:02:20,103][63770] Sum rewards: 1.270, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.001', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.018', 'ARMOR': '0.032', 'AMMO4': '0.088', 'WEAPON5': '0.100', 'AMMO3': '0.131', 'weapon5': '0.132', 'WEAPON4': '0.200', 'HITCOUNT': '0.260', 'weapon4': '0.374', 'WEAPON3': '0.650', 'weapon2': '0.714', 'DAMAGECOUNT': '1.155', 'FRAGCOUNT': '2.000', 'weapon3': '2.152'} +[2023-09-14 15:02:24,146][63767] DAMAGECOUNT value on done: 14707.0 +[2023-09-14 15:02:24,147][63767] Sum rewards: 0.632, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.140', 'AMMO5': '0.010', 'AMMO2': '0.013', 'AMMO4': '0.064', 'weapon5': '0.068', 'WEAPON1': '0.070', 'AMMO3': '0.079', 'HITCOUNT': '0.150', 'WEAPON5': '0.200', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.630', 'FRAGCOUNT': '1.000', 'weapon3': '1.492', 'weapon2': '1.696'} +[2023-09-14 15:02:24,530][63767] DAMAGECOUNT value on done: 17108.0 +[2023-09-14 15:02:24,530][63767] Sum rewards: 0.040, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.158', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.013', 'AMMO4': '0.066', 'weapon5': '0.078', 'WEAPON4': '0.100', 'ARMOR': '0.116', 'AMMO3': '0.136', 'WEAPON5': '0.150', 'HITCOUNT': '0.260', 'weapon4': '0.362', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.873', 'weapon3': '1.150', 'weapon2': '1.524', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:02:24,851][63733] Updated weights for policy 1, policy_version 2150 (0.0010) +[2023-09-14 15:02:24,888][63732] Updated weights for policy 0, policy_version 2090 (0.0012) +[2023-09-14 15:02:26,234][63771] DAMAGECOUNT value on done: 11563.0 +[2023-09-14 15:02:26,235][63771] Sum rewards: -1.880, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.140', 'AMMO5': '0.007', 'AMMO2': '0.008', 'AMMO4': '0.042', 'ARMOR': '0.052', 'weapon5': '0.066', 'weapon4': '0.078', 'HITCOUNT': '0.090', 'AMMO3': '0.106', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.600', 'weapon3': '1.406', 'weapon2': '1.584', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:26,496][63735] Large shaping reward -2.549 for [('FRAGCOUNT', -1.5, -1.0), ('DEATHCOUNT', -0.75, 1.0), ('HEALTH', -0.3, -100.0), ('AMMO5', -0.0005, -1.0), ('weapon5', 0.002)] +[2023-09-14 15:02:26,641][63771] DAMAGECOUNT value on done: 14265.0 +[2023-09-14 15:02:26,641][63771] Sum rewards: 1.121, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.952', 'AMMO5': '0.003', 'AMMO2': '0.015', 'ARMOR': '0.034', 'weapon7': '0.050', 'AMMO3': '0.060', 'AMMO4': '0.072', 'HITCOUNT': '0.110', 'weapon4': '0.154', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.375', 'weapon3': '1.018', 'weapon2': '1.662', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:27,466][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002092_8568832.pth... +[2023-09-14 15:02:27,466][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000002155_8826880.pth... +[2023-09-14 15:02:27,526][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001741_7131136.pth +[2023-09-14 15:02:27,527][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001846_7561216.pth +[2023-09-14 15:02:27,534][63576] Saving new best policy, reward=-2.247! +[2023-09-14 15:02:27,663][63769] DAMAGECOUNT value on done: 13249.0 +[2023-09-14 15:02:27,663][63769] Sum rewards: -0.348, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.476', 'AMMO2': '0.002', 'AMMO4': '0.008', 'AMMO5': '0.027', 'WEAPON1': '0.040', 'AMMO3': '0.147', 'weapon5': '0.296', 'HITCOUNT': '0.340', 'WEAPON5': '0.550', 'WEAPON3': '0.750', 'weapon2': '1.442', 'DAMAGECOUNT': '1.677', 'weapon3': '1.848', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:02:28,088][63769] DAMAGECOUNT value on done: 11850.0 +[2023-09-14 15:02:28,088][63769] Sum rewards: -1.230, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.100', 'AMMO2': '0.014', 'AMMO5': '0.015', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'weapon4': '0.050', 'AMMO4': '0.072', 'ARMOR': '0.088', 'AMMO3': '0.098', 'weapon5': '0.102', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'WEAPON3': '0.450', 'DAMAGECOUNT': '1.005', 'weapon3': '1.426', 'FRAGCOUNT': '1.500', 'weapon2': '1.750'} +[2023-09-14 15:02:29,001][63770] DAMAGECOUNT value on done: 10954.0 +[2023-09-14 15:02:29,378][63770] DAMAGECOUNT value on done: 13608.0 +[2023-09-14 15:02:29,378][63770] Sum rewards: -1.957, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.760', 'AMMO2': '0.004', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'ARMOR': '0.016', 'AMMO4': '0.022', 'weapon5': '0.040', 'WEAPON5': '0.050', 'AMMO3': '0.164', 'HITCOUNT': '0.260', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.891', 'weapon3': '1.470', 'weapon2': '1.918', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:02:29,917][63733] Updated weights for policy 1, policy_version 2160 (0.0010) +[2023-09-14 15:02:30,651][63805] DAMAGECOUNT value on done: 14307.0 +[2023-09-14 15:02:31,047][63805] DAMAGECOUNT value on done: 15623.0 +[2023-09-14 15:02:31,048][63805] Sum rewards: -6.425, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.926', 'AMMO2': '0.008', 'AMMO4': '0.039', 'WEAPON4': '0.100', 'AMMO3': '0.159', 'HITCOUNT': '0.190', 'weapon4': '0.244', 'ARMOR': '0.588', 'DAMAGECOUNT': '0.765', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.390', 'weapon3': '1.468'} +[2023-09-14 15:02:32,069][63806] DAMAGECOUNT value on done: 11994.0 +[2023-09-14 15:02:32,070][63806] Sum rewards: -10.252, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-3.680', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'AMMO5': '0.020', 'weapon5': '0.028', 'ARMOR': '0.092', 'HITCOUNT': '0.170', 'AMMO3': '0.236', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.495', 'FRAGCOUNT': '1.000', 'weapon2': '1.226', 'WEAPON3': '1.400', 'weapon3': '1.992'} +[2023-09-14 15:02:32,388][63806] DAMAGECOUNT value on done: 12417.0 +[2023-09-14 15:02:34,011][63734] DAMAGECOUNT value on done: 14559.0 +[2023-09-14 15:02:34,012][63734] Sum rewards: 4.967, reward structure: {'DEATHCOUNT': '-4.500', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.013', 'ARMOR': '0.036', 'AMMO4': '0.064', 'AMMO3': '0.077', 'HEALTH': '0.144', 'WEAPON5': '0.150', 'HITCOUNT': '0.150', 'weapon5': '0.166', 'WEAPON3': '0.300', 'weapon2': '1.388', 'weapon3': '1.446', 'DAMAGECOUNT': '1.515', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:02:34,375][63734] DAMAGECOUNT value on done: 12638.0 +[2023-09-14 15:02:34,376][63734] Sum rewards: -1.896, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.572', 'weapon7': '0.008', 'AMMO2': '0.010', 'AMMO5': '0.014', 'AMMO4': '0.052', 'ARMOR': '0.068', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.144', 'AMMO3': '0.190', 'weapon5': '0.204', 'WEAPON5': '0.350', 'HITCOUNT': '0.480', 'weapon2': '1.036', 'WEAPON3': '1.150', 'DAMAGECOUNT': '2.112', 'weapon3': '2.208', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:02:34,834][63806] DAMAGECOUNT value on done: 12243.0 +[2023-09-14 15:02:34,834][63806] Sum rewards: -9.430, reward structure: {'DEATHCOUNT': '-14.250', 'HEALTH': '-2.327', 'AMMO5': '0.007', 'AMMO2': '0.019', 'WEAPON1': '0.020', 'weapon4': '0.052', 'AMMO4': '0.094', 'HITCOUNT': '0.130', 'WEAPON5': '0.150', 'AMMO3': '0.177', 'WEAPON4': '0.250', 'ARMOR': '0.497', 'DAMAGECOUNT': '0.546', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.494', 'weapon3': '1.760'} +[2023-09-14 15:02:35,014][63733] Updated weights for policy 1, policy_version 2170 (0.0010) +[2023-09-14 15:02:35,196][63735] DAMAGECOUNT value on done: 13613.0 +[2023-09-14 15:02:35,196][63735] Sum rewards: -0.227, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.569', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.022', 'WEAPON5': '0.050', 'ARMOR': '0.056', 'weapon4': '0.066', 'AMMO3': '0.099', 'WEAPON4': '0.100', 'AMMO4': '0.109', 'HITCOUNT': '0.210', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.885', 'FRAGCOUNT': '1.000', 'weapon2': '1.538', 'weapon3': '1.644'} +[2023-09-14 15:02:35,205][63806] DAMAGECOUNT value on done: 12461.0 +[2023-09-14 15:02:35,205][63806] Sum rewards: -2.540, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.051', 'AMMO2': '0.014', 'AMMO5': '0.015', 'ARMOR': '0.016', 'WEAPON1': '0.030', 'AMMO4': '0.068', 'WEAPON4': '0.100', 'AMMO3': '0.112', 'weapon4': '0.116', 'HITCOUNT': '0.170', 'weapon5': '0.260', 'WEAPON5': '0.350', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.951', 'weapon2': '1.484', 'weapon3': '1.824'} +[2023-09-14 15:02:35,576][63735] DAMAGECOUNT value on done: 9779.0 +[2023-09-14 15:02:35,576][63735] Sum rewards: -3.141, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.026', 'AMMO5': '0.005', 'AMMO2': '0.007', 'weapon5': '0.010', 'WEAPON1': '0.020', 'AMMO4': '0.034', 'WEAPON5': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.132', 'ARMOR': '0.148', 'WEAPON4': '0.150', 'weapon4': '0.204', 'DAMAGECOUNT': '0.345', 'WEAPON3': '0.700', 'weapon3': '1.426', 'weapon2': '1.494', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:36,577][63769] DAMAGECOUNT value on done: 14424.0 +[2023-09-14 15:02:36,577][63769] Sum rewards: -1.374, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.140', 'AMMO2': '0.005', 'weapon4': '0.016', 'AMMO5': '0.017', 'AMMO4': '0.023', 'WEAPON1': '0.030', 'ARMOR': '0.030', 'WEAPON4': '0.100', 'AMMO3': '0.144', 'HITCOUNT': '0.190', 'weapon5': '0.250', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.549', 'WEAPON3': '0.850', 'weapon2': '1.132', 'weapon3': '2.080', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:02:36,890][63769] DAMAGECOUNT value on done: 9943.0 +[2023-09-14 15:02:36,890][63769] Sum rewards: 0.297, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO5': '0.005', 'AMMO2': '0.021', 'WEAPON4': '0.050', 'WEAPON5': '0.050', 'weapon5': '0.092', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO4': '0.103', 'AMMO3': '0.118', 'weapon7': '0.122', 'weapon4': '0.204', 'HITCOUNT': '0.210', 'HEALTH': '0.228', 'ARMOR': '0.424', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.660', 'weapon2': '1.152', 'weapon3': '1.358', 'FRAGCOUNT': '1.500'} +[2023-09-14 15:02:37,472][63732] Updated weights for policy 0, policy_version 2100 (0.0011) +[2023-09-14 15:02:37,944][63735] DAMAGECOUNT value on done: 11426.0 +[2023-09-14 15:02:37,945][63735] Sum rewards: -1.696, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.904', 'AMMO2': '0.001', 'AMMO5': '0.004', 'AMMO4': '0.006', 'ARMOR': '0.040', 'weapon5': '0.044', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.140', 'HITCOUNT': '0.150', 'weapon4': '0.240', 'DAMAGECOUNT': '0.711', 'WEAPON3': '0.800', 'weapon2': '0.964', 'weapon3': '1.908', 'FRAGCOUNT': '2.500'} +[2023-09-14 15:02:38,348][63735] DAMAGECOUNT value on done: 15301.0 +[2023-09-14 15:02:38,348][63735] Sum rewards: -1.909, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.797', 'AMMO4': '-0.030', 'AMMO2': '-0.006', 'WEAPON4': '0.050', 'ARMOR': '0.080', 'AMMO3': '0.115', 'HITCOUNT': '0.190', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.354', 'weapon3': '1.840'} +[2023-09-14 15:02:38,847][63767] DAMAGECOUNT value on done: 14448.0 +[2023-09-14 15:02:39,237][63767] DAMAGECOUNT value on done: 13784.0 +[2023-09-14 15:02:39,238][63767] Sum rewards: -4.448, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.732', 'weapon5': '0.002', 'AMMO5': '0.003', 'AMMO2': '0.017', 'ARMOR': '0.036', 'WEAPON5': '0.050', 'weapon4': '0.056', 'AMMO4': '0.083', 'AMMO3': '0.136', 'HITCOUNT': '0.160', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.612', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.102', 'weapon3': '1.928'} +[2023-09-14 15:02:39,369][63771] DAMAGECOUNT value on done: 12852.0 +[2023-09-14 15:02:39,369][63771] Sum rewards: -4.008, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.812', 'AMMO2': '0.005', 'AMMO5': '0.008', 'WEAPON1': '0.010', 'weapon5': '0.026', 'AMMO4': '0.026', 'ARMOR': '0.051', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'AMMO3': '0.151', 'weapon4': '0.152', 'HITCOUNT': '0.320', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.999', 'weapon2': '1.620', 'weapon3': '1.736', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:39,756][63771] DAMAGECOUNT value on done: 10112.0 +[2023-09-14 15:02:39,756][63771] Sum rewards: -5.713, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.724', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'AMMO5': '0.018', 'HITCOUNT': '0.020', 'ARMOR': '0.032', 'AMMO4': '0.054', 'DAMAGECOUNT': '0.060', 'AMMO3': '0.130', 'WEAPON5': '0.300', 'weapon5': '0.388', 'WEAPON3': '0.700', 'weapon2': '1.436', 'weapon3': '1.602'} +[2023-09-14 15:02:40,055][63733] Updated weights for policy 1, policy_version 2180 (0.0011) +[2023-09-14 15:02:42,058][63805] DAMAGECOUNT value on done: 13876.0 +[2023-09-14 15:02:42,059][63805] Sum rewards: -0.263, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.414', 'AMMO2': '0.005', 'WEAPON1': '0.010', 'AMMO4': '0.027', 'AMMO3': '0.092', 'HITCOUNT': '0.140', 'ARMOR': '0.497', 'DAMAGECOUNT': '0.516', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.582', 'weapon2': '1.732'} +[2023-09-14 15:02:42,409][63805] DAMAGECOUNT value on done: 11155.0 +[2023-09-14 15:02:42,410][63805] Sum rewards: -4.815, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.290', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'ARMOR': '0.024', 'weapon4': '0.032', 'weapon5': '0.032', 'AMMO2': '0.040', 'WEAPON5': '0.050', 'HITCOUNT': '0.120', 'AMMO3': '0.135', 'AMMO4': '0.199', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.480', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.442', 'weapon3': '1.708'} +[2023-09-14 15:02:43,375][63734] DAMAGECOUNT value on done: 12568.0 +[2023-09-14 15:02:43,376][63734] Sum rewards: -0.781, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.317', 'weapon5': '0.002', 'AMMO5': '0.007', 'AMMO2': '0.016', 'WEAPON1': '0.020', 'weapon4': '0.052', 'AMMO4': '0.080', 'AMMO3': '0.114', 'ARMOR': '0.116', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'HITCOUNT': '0.240', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.948', 'weapon2': '1.424', 'weapon3': '1.816', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:43,759][63734] DAMAGECOUNT value on done: 12470.0 +[2023-09-14 15:02:43,760][63734] Sum rewards: -0.756, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.792', 'AMMO4': '-0.006', 'AMMO2': '-0.001', 'weapon5': '0.002', 'AMMO5': '0.005', 'weapon4': '0.012', 'WEAPON4': '0.050', 'AMMO3': '0.098', 'WEAPON5': '0.100', 'ARMOR': '0.104', 'HITCOUNT': '0.110', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.546', 'weapon3': '1.566', 'weapon2': '1.700', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:44,697][63770] DAMAGECOUNT value on done: 14698.0 +[2023-09-14 15:02:44,697][63770] Sum rewards: -8.123, reward structure: {'DEATHCOUNT': '-13.500', 'HEALTH': '-2.107', 'WEAPON1': '0.010', 'AMMO5': '0.010', 'AMMO2': '0.019', 'ARMOR': '0.060', 'weapon5': '0.086', 'AMMO4': '0.095', 'weapon4': '0.124', 'HITCOUNT': '0.130', 'WEAPON4': '0.150', 'WEAPON5': '0.150', 'AMMO3': '0.156', 'DAMAGECOUNT': '0.420', 'WEAPON3': '0.900', 'weapon3': '1.284', 'weapon2': '1.890', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:45,042][63770] DAMAGECOUNT value on done: 11168.0 +[2023-09-14 15:02:45,043][63770] Sum rewards: 2.220, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.035', 'AMMO4': '-0.003', 'AMMO2': '-0.001', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO3': '0.093', 'WEAPON4': '0.100', 'weapon5': '0.158', 'HITCOUNT': '0.190', 'weapon4': '0.198', 'WEAPON5': '0.200', 'ARMOR': '0.511', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.005', 'weapon2': '1.294', 'weapon3': '1.640', 'FRAGCOUNT': '2.500'} +[2023-09-14 15:02:45,141][63733] Updated weights for policy 1, policy_version 2190 (0.0010) +[2023-09-14 15:02:48,249][63767] DAMAGECOUNT value on done: 14911.0 +[2023-09-14 15:02:48,249][63767] Sum rewards: -2.253, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.322', 'AMMO4': '-0.021', 'AMMO2': '-0.004', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'WEAPON5': '0.100', 'ARMOR': '0.104', 'AMMO3': '0.133', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.612', 'WEAPON3': '0.850', 'weapon2': '1.578', 'weapon3': '1.772', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:48,606][63767] DAMAGECOUNT value on done: 17413.0 +[2023-09-14 15:02:48,607][63767] Sum rewards: -0.090, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.500', 'AMMO2': '0.005', 'WEAPON1': '0.010', 'AMMO4': '0.025', 'WEAPON4': '0.050', 'ARMOR': '0.072', 'AMMO3': '0.079', 'weapon4': '0.104', 'HITCOUNT': '0.270', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.915', 'weapon2': '1.482', 'weapon3': '1.598', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:50,284][63733] Updated weights for policy 1, policy_version 2200 (0.0011) +[2023-09-14 15:02:50,305][63732] Updated weights for policy 0, policy_version 2110 (0.0010) +[2023-09-14 15:02:50,390][63771] DAMAGECOUNT value on done: 11778.0 +[2023-09-14 15:02:50,391][63771] Sum rewards: -0.304, reward structure: {'DEATHCOUNT': '-6.750', 'weapon5': '0.006', 'AMMO5': '0.007', 'AMMO2': '0.010', 'AMMO4': '0.049', 'AMMO3': '0.070', 'WEAPON4': '0.100', 'weapon4': '0.132', 'ARMOR': '0.139', 'HITCOUNT': '0.150', 'WEAPON5': '0.150', 'WEAPON3': '0.350', 'HEALTH': '0.606', 'DAMAGECOUNT': '0.645', 'FRAGCOUNT': '1.000', 'weapon3': '1.510', 'weapon2': '1.522'} +[2023-09-14 15:02:50,779][63771] DAMAGECOUNT value on done: 14530.0 +[2023-09-14 15:02:50,780][63771] Sum rewards: -4.145, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.749', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.014', 'ARMOR': '0.053', 'AMMO4': '0.069', 'weapon4': '0.072', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.125', 'HITCOUNT': '0.210', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.795', 'FRAGCOUNT': '1.000', 'weapon2': '1.620', 'weapon3': '1.678'} +[2023-09-14 15:02:52,579][63769] DAMAGECOUNT value on done: 13374.0 +[2023-09-14 15:02:52,580][63769] Sum rewards: -4.922, reward structure: {'DEATHCOUNT': '-10.500', 'FRAGCOUNT': '-0.500', 'WEAPON1': '0.010', 'AMMO5': '0.017', 'ARMOR': '0.020', 'AMMO2': '0.031', 'weapon7': '0.064', 'HITCOUNT': '0.080', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon4': '0.120', 'AMMO3': '0.131', 'weapon5': '0.146', 'WEAPON4': '0.150', 'AMMO4': '0.153', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.375', 'HEALTH': '0.420', 'WEAPON3': '0.650', 'weapon2': '1.174', 'weapon3': '1.936'} +[2023-09-14 15:02:53,024][63769] DAMAGECOUNT value on done: 12095.0 +[2023-09-14 15:02:53,024][63769] Sum rewards: -3.861, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.424', 'AMMO5': '0.003', 'weapon5': '0.006', 'AMMO2': '0.019', 'WEAPON5': '0.050', 'ARMOR': '0.080', 'AMMO4': '0.093', 'weapon4': '0.096', 'AMMO3': '0.159', 'WEAPON4': '0.200', 'HITCOUNT': '0.230', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.735', 'FRAGCOUNT': '1.000', 'weapon2': '1.298', 'weapon3': '1.644'} +[2023-09-14 15:02:53,054][63770] DAMAGECOUNT value on done: 11097.0 +[2023-09-14 15:02:53,054][63770] Sum rewards: 1.323, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-1.152', 'AMMO2': '0.007', 'AMMO5': '0.013', 'ARMOR': '0.036', 'AMMO4': '0.037', 'WEAPON4': '0.050', 'AMMO3': '0.060', 'weapon4': '0.068', 'HITCOUNT': '0.090', 'weapon7': '0.104', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON7': '0.200', 'WEAPON5': '0.250', 'weapon5': '0.326', 'DAMAGECOUNT': '0.429', 'WEAPON3': '0.450', 'weapon3': '1.094', 'weapon2': '1.520', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:53,440][63770] DAMAGECOUNT value on done: 13760.0 +[2023-09-14 15:02:54,088][63805] DAMAGECOUNT value on done: 14502.0 +[2023-09-14 15:02:54,089][63805] Sum rewards: 0.488, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.346', 'WEAPON1': '0.010', 'AMMO5': '0.013', 'AMMO2': '0.018', 'weapon4': '0.040', 'weapon5': '0.078', 'AMMO4': '0.087', 'WEAPON4': '0.100', 'AMMO3': '0.115', 'HITCOUNT': '0.190', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.585', 'ARMOR': '0.588', 'WEAPON3': '0.650', 'weapon2': '1.330', 'weapon3': '1.530', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:02:54,483][63805] DAMAGECOUNT value on done: 15763.0 +[2023-09-14 15:02:54,484][63805] Sum rewards: -1.960, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.261', 'AMMO2': '0.026', 'weapon4': '0.036', 'AMMO4': '0.128', 'AMMO3': '0.139', 'HITCOUNT': '0.140', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.420', 'ARMOR': '0.490', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.694', 'weapon2': '1.778'} +[2023-09-14 15:02:55,345][63733] Updated weights for policy 1, policy_version 2210 (0.0011) +[2023-09-14 15:02:55,560][63806] DAMAGECOUNT value on done: 12469.0 +[2023-09-14 15:02:55,560][63806] Sum rewards: -2.427, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.733', 'AMMO5': '0.007', 'AMMO2': '0.008', 'ARMOR': '0.024', 'AMMO4': '0.042', 'WEAPON5': '0.100', 'AMMO3': '0.175', 'HITCOUNT': '0.380', 'WEAPON3': '1.000', 'DAMAGECOUNT': '1.425', 'weapon2': '1.444', 'weapon3': '1.950', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:02:55,895][63734] DAMAGECOUNT value on done: 14843.0 +[2023-09-14 15:02:55,896][63734] Sum rewards: 2.862, reward structure: {'DEATHCOUNT': '-3.750', 'HEALTH': '-0.441', 'AMMO5': '0.003', 'AMMO2': '0.011', 'weapon4': '0.030', 'WEAPON5': '0.050', 'AMMO4': '0.053', 'weapon5': '0.062', 'ARMOR': '0.064', 'WEAPON4': '0.100', 'AMMO3': '0.122', 'HITCOUNT': '0.210', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.852', 'weapon2': '1.168', 'weapon3': '1.878', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:55,960][63806] DAMAGECOUNT value on done: 12762.0 +[2023-09-14 15:02:55,960][63806] Sum rewards: -1.761, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.006', 'weapon5': '0.004', 'AMMO2': '0.005', 'AMMO5': '0.020', 'AMMO4': '0.026', 'ARMOR': '0.068', 'WEAPON4': '0.150', 'AMMO3': '0.155', 'WEAPON5': '0.200', 'weapon4': '0.214', 'HITCOUNT': '0.290', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.035', 'weapon2': '1.418', 'weapon3': '1.760', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:56,214][63734] DAMAGECOUNT value on done: 12808.0 +[2023-09-14 15:02:56,215][63734] Sum rewards: -0.850, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.955', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'weapon7': '0.054', 'weapon5': '0.072', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.140', 'weapon4': '0.158', 'HITCOUNT': '0.170', 'WEAPON7': '0.200', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.402', 'weapon3': '1.670'} +[2023-09-14 15:02:58,830][63769] DAMAGECOUNT value on done: 14693.0 +[2023-09-14 15:02:58,831][63769] Sum rewards: -0.621, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.472', 'AMMO5': '0.005', 'AMMO2': '0.012', 'ARMOR': '0.044', 'WEAPON5': '0.050', 'AMMO4': '0.062', 'weapon5': '0.106', 'AMMO3': '0.121', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'weapon4': '0.272', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.807', 'weapon2': '1.350', 'weapon3': '1.452', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:02:58,974][63735] DAMAGECOUNT value on done: 13878.0 +[2023-09-14 15:02:58,975][63735] Sum rewards: -2.380, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.786', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'weapon5': '0.010', 'AMMO2': '0.045', 'WEAPON5': '0.050', 'AMMO3': '0.135', 'ARMOR': '0.135', 'HITCOUNT': '0.190', 'AMMO4': '0.227', 'weapon4': '0.256', 'WEAPON4': '0.450', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.795', 'weapon2': '1.248', 'weapon3': '1.652', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:02:59,193][63769] DAMAGECOUNT value on done: 10398.0 +[2023-09-14 15:02:59,193][63769] Sum rewards: 2.731, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.726', 'AMMO5': '0.007', 'AMMO2': '0.026', 'ARMOR': '0.036', 'WEAPON1': '0.040', 'WEAPON4': '0.050', 'weapon7': '0.090', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon4': '0.110', 'HITCOUNT': '0.120', 'AMMO3': '0.127', 'AMMO4': '0.128', 'WEAPON5': '0.200', 'weapon5': '0.206', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.909', 'weapon2': '1.150', 'weapon3': '1.658', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:02:59,299][63735] DAMAGECOUNT value on done: 10024.0 +[2023-09-14 15:02:59,300][63735] Sum rewards: -0.880, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-2.240', 'AMMO4': '-0.028', 'AMMO2': '-0.006', 'ARMOR': '0.020', 'AMMO3': '0.122', 'HITCOUNT': '0.180', 'DAMAGECOUNT': '0.735', 'WEAPON3': '0.850', 'weapon2': '1.178', 'weapon3': '2.058', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:02:59,442][63806] DAMAGECOUNT value on done: 12333.0 +[2023-09-14 15:02:59,779][63806] DAMAGECOUNT value on done: 12721.0 +[2023-09-14 15:02:59,779][63806] Sum rewards: -3.862, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.161', 'AMMO5': '0.005', 'AMMO2': '0.009', 'weapon5': '0.020', 'AMMO4': '0.045', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'ARMOR': '0.132', 'AMMO3': '0.140', 'HITCOUNT': '0.260', 'weapon4': '0.348', 'DAMAGECOUNT': '0.780', 'WEAPON3': '0.950', 'weapon2': '1.344', 'weapon3': '1.816', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:00,429][63733] Updated weights for policy 1, policy_version 2220 (0.0011) +[2023-09-14 15:03:02,537][63767] DAMAGECOUNT value on done: 14518.0 +[2023-09-14 15:03:02,537][63767] Sum rewards: -1.573, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.729', 'AMMO2': '0.001', 'AMMO5': '0.005', 'AMMO4': '0.005', 'WEAPON1': '0.020', 'weapon4': '0.026', 'weapon5': '0.040', 'WEAPON4': '0.050', 'HITCOUNT': '0.070', 'ARMOR': '0.077', 'WEAPON5': '0.100', 'AMMO3': '0.105', 'DAMAGECOUNT': '0.210', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.262', 'weapon2': '1.534'} +[2023-09-14 15:03:02,653][63735] DAMAGECOUNT value on done: 11633.0 +[2023-09-14 15:03:02,653][63735] Sum rewards: -0.473, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.770', 'AMMO2': '0.012', 'AMMO4': '0.061', 'ARMOR': '0.116', 'AMMO3': '0.119', 'WEAPON4': '0.150', 'HITCOUNT': '0.200', 'weapon4': '0.388', 'DAMAGECOUNT': '0.621', 'WEAPON3': '0.700', 'weapon3': '1.252', 'weapon2': '1.428', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:02,838][63767] DAMAGECOUNT value on done: 13929.0 +[2023-09-14 15:03:02,838][63767] Sum rewards: -0.701, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO5': '0.007', 'AMMO2': '0.009', 'WEAPON1': '0.010', 'weapon5': '0.038', 'AMMO4': '0.046', 'weapon4': '0.078', 'WEAPON4': '0.100', 'weapon7': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.115', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON5': '0.150', 'WEAPON7': '0.200', 'HEALTH': '0.264', 'ARMOR': '0.400', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon3': '1.450', 'weapon2': '1.546'} +[2023-09-14 15:03:02,997][63732] Updated weights for policy 0, policy_version 2120 (0.0010) +[2023-09-14 15:03:03,064][63735] DAMAGECOUNT value on done: 15791.0 +[2023-09-14 15:03:03,064][63735] Sum rewards: -1.221, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.054', 'AMMO5': '0.013', 'AMMO2': '0.017', 'ARMOR': '0.044', 'weapon5': '0.070', 'AMMO4': '0.082', 'WEAPON4': '0.100', 'AMMO3': '0.151', 'WEAPON5': '0.200', 'weapon4': '0.234', 'HITCOUNT': '0.330', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.470', 'weapon3': '1.672', 'weapon2': '1.700', 'FRAGCOUNT': '5.000'} +[2023-09-14 15:03:04,205][63771] DAMAGECOUNT value on done: 13233.0 +[2023-09-14 15:03:04,205][63771] Sum rewards: -2.580, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.849', 'AMMO4': '-0.024', 'AMMO2': '-0.005', 'FRAGCOUNT': '0.000', 'AMMO5': '0.019', 'AMMO3': '0.103', 'weapon5': '0.172', 'HITCOUNT': '0.310', 'WEAPON5': '0.350', 'WEAPON3': '0.500', 'ARMOR': '0.532', 'DAMAGECOUNT': '1.143', 'weapon2': '1.588', 'weapon3': '1.830'} +[2023-09-14 15:03:04,669][63771] DAMAGECOUNT value on done: 10399.0 +[2023-09-14 15:03:04,670][63771] Sum rewards: -3.080, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.815', 'AMMO4': '-0.003', 'AMMO2': '-0.001', 'AMMO5': '0.010', 'weapon5': '0.032', 'AMMO3': '0.139', 'WEAPON5': '0.150', 'HITCOUNT': '0.250', 'ARMOR': '0.531', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.861', 'weapon2': '1.528', 'weapon3': '1.888', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:05,533][63733] Updated weights for policy 1, policy_version 2230 (0.0011) +[2023-09-14 15:03:05,740][63805] DAMAGECOUNT value on done: 13891.0 +[2023-09-14 15:03:06,125][63805] DAMAGECOUNT value on done: 11478.0 +[2023-09-14 15:03:06,125][63805] Sum rewards: -3.120, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.110', 'weapon4': '0.002', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'ARMOR': '0.044', 'WEAPON5': '0.050', 'AMMO4': '0.084', 'WEAPON4': '0.100', 'weapon5': '0.104', 'AMMO3': '0.114', 'HITCOUNT': '0.290', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.969', 'weapon3': '1.512', 'weapon2': '1.742', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:07,242][63734] DAMAGECOUNT value on done: 12850.0 +[2023-09-14 15:03:07,243][63734] Sum rewards: -1.414, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.068', 'AMMO2': '0.004', 'AMMO4': '0.021', 'ARMOR': '0.040', 'AMMO3': '0.093', 'HITCOUNT': '0.200', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.846', 'weapon3': '1.648', 'weapon2': '1.702', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:07,667][63734] DAMAGECOUNT value on done: 12575.0 +[2023-09-14 15:03:07,668][63734] Sum rewards: 0.494, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-1.400', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'ARMOR': '0.072', 'HITCOUNT': '0.080', 'AMMO3': '0.087', 'WEAPON4': '0.100', 'weapon4': '0.182', 'weapon5': '0.252', 'DAMAGECOUNT': '0.315', 'WEAPON5': '0.350', 'WEAPON3': '0.550', 'weapon3': '0.938', 'weapon2': '1.460', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:09,740][63770] DAMAGECOUNT value on done: 14918.0 +[2023-09-14 15:03:09,740][63770] Sum rewards: -5.115, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.631', 'weapon4': '0.002', 'AMMO2': '0.011', 'AMMO5': '0.017', 'ARMOR': '0.040', 'WEAPON1': '0.040', 'WEAPON4': '0.050', 'AMMO4': '0.056', 'AMMO3': '0.167', 'HITCOUNT': '0.170', 'weapon5': '0.214', 'WEAPON5': '0.250', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.660', 'WEAPON3': '1.000', 'weapon2': '1.024', 'weapon3': '2.064'} +[2023-09-14 15:03:10,069][63770] DAMAGECOUNT value on done: 11697.0 +[2023-09-14 15:03:10,070][63770] Sum rewards: 0.471, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.748', 'AMMO4': '-0.002', 'AMMO2': '-0.000', 'AMMO5': '0.014', 'weapon5': '0.090', 'WEAPON5': '0.100', 'ARMOR': '0.108', 'AMMO3': '0.158', 'WEAPON4': '0.200', 'weapon4': '0.216', 'HITCOUNT': '0.250', 'WEAPON3': '0.900', 'weapon2': '1.156', 'DAMAGECOUNT': '1.587', 'weapon3': '2.192', 'FRAGCOUNT': '3.500'} +[2023-09-14 15:03:10,724][63733] Updated weights for policy 1, policy_version 2240 (0.0010) +[2023-09-14 15:03:11,854][63767] DAMAGECOUNT value on done: 15191.0 +[2023-09-14 15:03:11,855][63767] Sum rewards: -1.637, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.577', 'AMMO4': '-0.013', 'AMMO2': '-0.003', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'ARMOR': '0.032', 'weapon5': '0.070', 'weapon7': '0.078', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.170', 'HITCOUNT': '0.210', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.840', 'weapon2': '1.552', 'weapon3': '1.638', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:03:12,222][63767] DAMAGECOUNT value on done: 17592.0 +[2023-09-14 15:03:12,223][63767] Sum rewards: -5.589, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.459', 'AMMO2': '0.000', 'AMMO4': '0.002', 'AMMO5': '0.003', 'ARMOR': '0.020', 'WEAPON5': '0.050', 'weapon5': '0.074', 'HITCOUNT': '0.150', 'AMMO3': '0.162', 'DAMAGECOUNT': '0.537', 'WEAPON3': '1.050', 'weapon2': '1.260', 'FRAGCOUNT': '2.000', 'weapon3': '2.062'} +[2023-09-14 15:03:14,566][63771] DAMAGECOUNT value on done: 11912.0 +[2023-09-14 15:03:14,567][63771] Sum rewards: -6.116, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.414', 'AMMO2': '0.005', 'WEAPON1': '0.010', 'AMMO5': '0.018', 'AMMO4': '0.024', 'ARMOR': '0.032', 'weapon4': '0.046', 'WEAPON4': '0.100', 'AMMO3': '0.112', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'weapon5': '0.280', 'DAMAGECOUNT': '0.402', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.214', 'weapon2': '1.846'} +[2023-09-14 15:03:14,985][63771] DAMAGECOUNT value on done: 14712.0 +[2023-09-14 15:03:14,985][63771] Sum rewards: -4.153, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.758', 'AMMO5': '0.005', 'weapon5': '0.006', 'AMMO2': '0.010', 'AMMO4': '0.050', 'ARMOR': '0.068', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'weapon4': '0.124', 'AMMO3': '0.141', 'HITCOUNT': '0.170', 'DAMAGECOUNT': '0.546', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.434', 'weapon3': '1.750'} +[2023-09-14 15:03:15,871][63733] Updated weights for policy 1, policy_version 2250 (0.0011) +[2023-09-14 15:03:15,881][63732] Updated weights for policy 0, policy_version 2130 (0.0011) +[2023-09-14 15:03:17,280][63770] DAMAGECOUNT value on done: 11287.0 +[2023-09-14 15:03:17,281][63770] Sum rewards: -0.578, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.245', 'AMMO2': '0.007', 'AMMO5': '0.013', 'AMMO4': '0.035', 'WEAPON1': '0.050', 'ARMOR': '0.100', 'AMMO3': '0.106', 'HITCOUNT': '0.170', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.570', 'weapon5': '0.634', 'WEAPON3': '0.700', 'weapon2': '1.086', 'weapon3': '1.696', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:17,564][63769] DAMAGECOUNT value on done: 13879.0 +[2023-09-14 15:03:17,565][63769] Sum rewards: 1.929, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.398', 'AMMO5': '0.015', 'AMMO2': '0.018', 'ARMOR': '0.020', 'weapon7': '0.026', 'WEAPON1': '0.040', 'weapon5': '0.070', 'AMMO4': '0.089', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.120', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'weapon4': '0.312', 'HITCOUNT': '0.370', 'WEAPON3': '0.700', 'weapon2': '1.084', 'DAMAGECOUNT': '1.515', 'weapon3': '1.948', 'FRAGCOUNT': '5.000'} +[2023-09-14 15:03:17,683][63770] DAMAGECOUNT value on done: 13891.0 +[2023-09-14 15:03:17,957][63769] DAMAGECOUNT value on done: 12175.0 +[2023-09-14 15:03:17,958][63769] Sum rewards: -3.773, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.690', 'AMMO4': '-0.026', 'AMMO2': '-0.005', 'AMMO5': '0.005', 'weapon5': '0.006', 'WEAPON1': '0.050', 'HITCOUNT': '0.090', 'AMMO3': '0.093', 'WEAPON5': '0.100', 'DAMAGECOUNT': '0.240', 'ARMOR': '0.456', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon3': '1.730', 'weapon2': '1.828'} +[2023-09-14 15:03:17,968][63805] DAMAGECOUNT value on done: 14726.0 +[2023-09-14 15:03:17,969][63805] Sum rewards: -5.343, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.495', 'AMMO2': '0.009', 'AMMO5': '0.011', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'AMMO4': '0.044', 'WEAPON4': '0.050', 'weapon5': '0.058', 'HITCOUNT': '0.160', 'AMMO3': '0.166', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.672', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.432', 'weapon3': '1.894'} +[2023-09-14 15:03:18,204][63734] DAMAGECOUNT value on done: 15323.0 +[2023-09-14 15:03:18,205][63734] Sum rewards: 2.684, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.156', 'AMMO5': '0.007', 'AMMO2': '0.010', 'WEAPON1': '0.010', 'AMMO4': '0.048', 'ARMOR': '0.064', 'WEAPON4': '0.100', 'AMMO3': '0.103', 'WEAPON5': '0.150', 'weapon4': '0.194', 'HITCOUNT': '0.210', 'weapon5': '0.250', 'WEAPON3': '0.500', 'DAMAGECOUNT': '1.440', 'weapon2': '1.494', 'weapon3': '1.510', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:18,340][63805] DAMAGECOUNT value on done: 15963.0 +[2023-09-14 15:03:18,340][63805] Sum rewards: -3.700, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.955', 'ARMOR': '0.012', 'AMMO2': '0.012', 'AMMO5': '0.013', 'WEAPON1': '0.040', 'AMMO4': '0.061', 'weapon4': '0.102', 'AMMO3': '0.127', 'HITCOUNT': '0.160', 'WEAPON4': '0.200', 'WEAPON6': '0.200', 'AMMO6': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.250', 'weapon5': '0.256', 'DAMAGECOUNT': '0.600', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon3': '1.448', 'weapon2': '1.524'} +[2023-09-14 15:03:18,587][63734] DAMAGECOUNT value on done: 12965.0 +[2023-09-14 15:03:19,664][63806] DAMAGECOUNT value on done: 12759.0 +[2023-09-14 15:03:19,664][63806] Sum rewards: -2.251, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.954', 'weapon4': '0.002', 'weapon5': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.013', 'ARMOR': '0.040', 'AMMO4': '0.065', 'WEAPON4': '0.100', 'AMMO3': '0.180', 'WEAPON5': '0.200', 'HITCOUNT': '0.230', 'DAMAGECOUNT': '0.870', 'WEAPON3': '1.050', 'weapon2': '1.764', 'weapon3': '1.920', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:03:20,037][63806] DAMAGECOUNT value on done: 13107.0 +[2023-09-14 15:03:20,038][63806] Sum rewards: 0.978, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.247', 'AMMO5': '0.006', 'AMMO2': '0.017', 'ARMOR': '0.024', 'WEAPON1': '0.040', 'WEAPON4': '0.050', 'weapon4': '0.050', 'weapon5': '0.066', 'AMMO4': '0.084', 'AMMO3': '0.097', 'WEAPON5': '0.150', 'HITCOUNT': '0.250', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.035', 'weapon2': '1.382', 'weapon3': '1.774', 'FRAGCOUNT': '2.500'} +[2023-09-14 15:03:20,926][63733] Updated weights for policy 1, policy_version 2260 (0.0010) +[2023-09-14 15:03:21,039][63769] DAMAGECOUNT value on done: 14927.0 +[2023-09-14 15:03:21,039][63769] Sum rewards: -0.463, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.434', 'AMMO2': '0.013', 'AMMO5': '0.014', 'AMMO4': '0.065', 'weapon7': '0.084', 'AMMO3': '0.098', 'HITCOUNT': '0.160', 'weapon5': '0.168', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'AMMO6': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.250', 'weapon4': '0.354', 'ARMOR': '0.486', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.702', 'weapon2': '1.114', 'weapon3': '1.412', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:21,381][63769] DAMAGECOUNT value on done: 10756.0 +[2023-09-14 15:03:21,382][63769] Sum rewards: 0.802, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.092', 'AMMO5': '0.007', 'AMMO2': '0.016', 'AMMO4': '0.078', 'WEAPON5': '0.100', 'weapon5': '0.104', 'AMMO3': '0.113', 'WEAPON4': '0.150', 'HITCOUNT': '0.210', 'weapon4': '0.228', 'ARMOR': '0.538', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.074', 'weapon2': '1.566', 'weapon3': '1.710', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:22,724][63735] DAMAGECOUNT value on done: 14148.0 +[2023-09-14 15:03:22,724][63735] Sum rewards: -8.759, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-3.508', 'AMMO4': '-0.075', 'AMMO2': '-0.015', 'AMMO5': '0.005', 'weapon5': '0.028', 'ARMOR': '0.036', 'WEAPON5': '0.100', 'AMMO3': '0.178', 'HITCOUNT': '0.260', 'DAMAGECOUNT': '0.810', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.598', 'weapon3': '1.824'} +[2023-09-14 15:03:23,100][63735] DAMAGECOUNT value on done: 10278.0 +[2023-09-14 15:03:23,101][63735] Sum rewards: -5.325, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.557', 'weapon4': '0.008', 'AMMO2': '0.012', 'AMMO5': '0.015', 'weapon5': '0.018', 'WEAPON1': '0.050', 'AMMO4': '0.059', 'ARMOR': '0.066', 'AMMO3': '0.120', 'WEAPON4': '0.150', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.762', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.330', 'weapon3': '1.872'} +[2023-09-14 15:03:23,978][63806] DAMAGECOUNT value on done: 12610.0 +[2023-09-14 15:03:23,979][63806] Sum rewards: -1.307, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.807', 'AMMO4': '-0.003', 'AMMO2': '-0.001', 'AMMO5': '0.005', 'weapon5': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.084', 'WEAPON5': '0.100', 'AMMO3': '0.129', 'HITCOUNT': '0.270', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.831', 'FRAGCOUNT': '1.000', 'weapon2': '1.414', 'weapon3': '1.686'} +[2023-09-14 15:03:24,355][63806] DAMAGECOUNT value on done: 13118.0 +[2023-09-14 15:03:24,356][63806] Sum rewards: 3.509, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.844', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'ARMOR': '0.028', 'weapon5': '0.102', 'AMMO3': '0.139', 'WEAPON5': '0.300', 'HITCOUNT': '0.300', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.191', 'weapon3': '1.526', 'weapon2': '1.888', 'FRAGCOUNT': '5.000'} +[2023-09-14 15:03:26,027][63733] Updated weights for policy 1, policy_version 2270 (0.0011) +[2023-09-14 15:03:26,358][63767] DAMAGECOUNT value on done: 14888.0 +[2023-09-14 15:03:26,358][63767] Sum rewards: -4.512, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.855', 'weapon5': '0.002', 'AMMO2': '0.007', 'WEAPON1': '0.020', 'AMMO5': '0.020', 'AMMO4': '0.036', 'ARMOR': '0.060', 'AMMO3': '0.182', 'weapon4': '0.196', 'WEAPON4': '0.250', 'HITCOUNT': '0.280', 'WEAPON5': '0.300', 'WEAPON3': '1.050', 'DAMAGECOUNT': '1.110', 'weapon3': '1.610', 'weapon2': '1.720', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:26,769][63767] DAMAGECOUNT value on done: 14404.0 +[2023-09-14 15:03:26,769][63767] Sum rewards: -0.241, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.870', 'AMMO5': '0.012', 'AMMO2': '0.022', 'ARMOR': '0.028', 'WEAPON1': '0.030', 'weapon4': '0.030', 'WEAPON4': '0.100', 'AMMO3': '0.103', 'AMMO4': '0.108', 'WEAPON5': '0.200', 'HITCOUNT': '0.260', 'weapon5': '0.352', 'WEAPON3': '0.550', 'weapon3': '1.262', 'DAMAGECOUNT': '1.425', 'weapon2': '1.646', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:27,116][63735] DAMAGECOUNT value on done: 11868.0 +[2023-09-14 15:03:27,116][63735] Sum rewards: -1.839, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.810', 'AMMO2': '0.009', 'AMMO5': '0.014', 'WEAPON1': '0.030', 'AMMO4': '0.043', 'weapon5': '0.092', 'WEAPON4': '0.100', 'AMMO3': '0.108', 'ARMOR': '0.108', 'weapon4': '0.156', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.705', 'FRAGCOUNT': '1.000', 'weapon3': '1.340', 'weapon2': '1.756'} +[2023-09-14 15:03:27,528][63735] DAMAGECOUNT value on done: 16047.0 +[2023-09-14 15:03:27,529][63735] Sum rewards: 0.113, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.444', 'AMMO2': '0.009', 'AMMO5': '0.012', 'AMMO4': '0.046', 'ARMOR': '0.052', 'weapon7': '0.076', 'weapon5': '0.098', 'WEAPON5': '0.100', 'AMMO3': '0.139', 'WEAPON4': '0.150', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON7': '0.200', 'HITCOUNT': '0.230', 'weapon4': '0.286', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.768', 'weapon2': '1.050', 'weapon3': '1.870', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:28,274][63732] Updated weights for policy 0, policy_version 2140 (0.0012) +[2023-09-14 15:03:29,436][63805] DAMAGECOUNT value on done: 14130.0 +[2023-09-14 15:03:29,436][63805] Sum rewards: 1.013, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.820', 'AMMO5': '0.010', 'AMMO2': '0.033', 'weapon4': '0.048', 'WEAPON1': '0.060', 'AMMO3': '0.123', 'WEAPON4': '0.150', 'AMMO4': '0.166', 'WEAPON5': '0.200', 'HITCOUNT': '0.220', 'weapon5': '0.492', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.717', 'weapon2': '1.352', 'weapon3': '1.562', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:29,474][63771] DAMAGECOUNT value on done: 13656.0 +[2023-09-14 15:03:29,475][63771] Sum rewards: -0.439, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.086', 'AMMO5': '0.017', 'AMMO2': '0.028', 'weapon7': '0.030', 'weapon4': '0.066', 'WEAPON4': '0.100', 'AMMO3': '0.132', 'AMMO4': '0.141', 'AMMO6': '0.160', 'AMMO7': '0.160', 'weapon5': '0.192', 'WEAPON7': '0.200', 'HITCOUNT': '0.210', 'WEAPON5': '0.250', 'WEAPON3': '0.550', 'DAMAGECOUNT': '1.269', 'weapon2': '1.588', 'weapon3': '1.804', 'FRAGCOUNT': '2.500'} +[2023-09-14 15:03:29,783][63805] DAMAGECOUNT value on done: 11933.0 +[2023-09-14 15:03:29,783][63805] Sum rewards: -1.258, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.216', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'weapon5': '0.048', 'AMMO4': '0.086', 'WEAPON4': '0.100', 'weapon4': '0.120', 'WEAPON5': '0.150', 'AMMO3': '0.156', 'HITCOUNT': '0.300', 'WEAPON3': '0.900', 'weapon2': '1.226', 'DAMAGECOUNT': '1.365', 'weapon3': '2.222', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:03:29,829][63771] DAMAGECOUNT value on done: 10464.0 +[2023-09-14 15:03:29,830][63771] Sum rewards: -3.459, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.162', 'AMMO5': '0.003', 'AMMO2': '0.008', 'WEAPON1': '0.010', 'ARMOR': '0.020', 'AMMO4': '0.038', 'weapon5': '0.040', 'WEAPON5': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.149', 'DAMAGECOUNT': '0.195', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.662', 'weapon3': '1.668'} +[2023-09-14 15:03:31,452][63734] DAMAGECOUNT value on done: 12980.0 +[2023-09-14 15:03:31,528][63733] Updated weights for policy 1, policy_version 2280 (0.0010) +[2023-09-14 15:03:31,823][63734] DAMAGECOUNT value on done: 12959.0 +[2023-09-14 15:03:31,823][63734] Sum rewards: -0.768, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.560', 'AMMO5': '0.003', 'AMMO2': '0.007', 'AMMO4': '0.033', 'WEAPON1': '0.040', 'WEAPON5': '0.050', 'AMMO3': '0.141', 'weapon5': '0.142', 'HITCOUNT': '0.360', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.152', 'weapon2': '1.518', 'weapon3': '1.796', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:34,831][63770] DAMAGECOUNT value on done: 15027.0 +[2023-09-14 15:03:35,182][63770] DAMAGECOUNT value on done: 12050.0 +[2023-09-14 15:03:35,182][63770] Sum rewards: -1.785, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.716', 'AMMO5': '0.005', 'ARMOR': '0.012', 'AMMO2': '0.031', 'AMMO3': '0.115', 'weapon5': '0.142', 'AMMO4': '0.155', 'WEAPON5': '0.200', 'HITCOUNT': '0.280', 'WEAPON4': '0.450', 'weapon4': '0.634', 'WEAPON3': '0.650', 'weapon2': '1.020', 'DAMAGECOUNT': '1.059', 'weapon3': '1.428', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:35,432][63767] DAMAGECOUNT value on done: 15358.0 +[2023-09-14 15:03:35,433][63767] Sum rewards: -3.272, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.262', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'AMMO2': '0.024', 'ARMOR': '0.060', 'weapon4': '0.086', 'AMMO4': '0.121', 'AMMO3': '0.130', 'HITCOUNT': '0.180', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'DAMAGECOUNT': '0.501', 'WEAPON3': '0.750', 'weapon5': '0.758', 'weapon3': '1.150', 'weapon2': '1.550', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:35,770][63767] DAMAGECOUNT value on done: 17822.0 +[2023-09-14 15:03:35,770][63767] Sum rewards: 1.850, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.236', 'AMMO5': '0.018', 'WEAPON1': '0.030', 'AMMO2': '0.035', 'weapon4': '0.106', 'AMMO3': '0.107', 'AMMO4': '0.173', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'WEAPON5': '0.350', 'weapon5': '0.484', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.690', 'weapon3': '1.108', 'weapon2': '1.966', 'FRAGCOUNT': '5.000'} +[2023-09-14 15:03:37,022][63733] Updated weights for policy 1, policy_version 2290 (0.0010) +[2023-09-14 15:03:38,387][63732] Updated weights for policy 0, policy_version 2150 (0.0011) +[2023-09-14 15:03:38,580][63771] DAMAGECOUNT value on done: 11946.0 +[2023-09-14 15:03:38,968][63771] DAMAGECOUNT value on done: 14800.0 +[2023-09-14 15:03:38,968][63771] Sum rewards: -0.162, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.012', 'AMMO2': '0.016', 'ARMOR': '0.045', 'WEAPON1': '0.060', 'AMMO3': '0.070', 'AMMO4': '0.080', 'HEALTH': '0.084', 'HITCOUNT': '0.100', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.264', 'WEAPON3': '0.350', 'weapon5': '0.476', 'FRAGCOUNT': '1.000', 'weapon3': '1.420', 'weapon2': '1.610'} +[2023-09-14 15:03:40,604][63734] DAMAGECOUNT value on done: 15627.0 +[2023-09-14 15:03:40,604][63734] Sum rewards: 0.577, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.029', 'AMMO2': '0.010', 'AMMO5': '0.012', 'AMMO4': '0.050', 'ARMOR': '0.088', 'weapon5': '0.090', 'AMMO3': '0.105', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'weapon4': '0.218', 'HITCOUNT': '0.230', 'WEAPON3': '0.700', 'weapon2': '0.904', 'DAMAGECOUNT': '0.912', 'weapon3': '1.886', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:40,944][63734] DAMAGECOUNT value on done: 13449.0 +[2023-09-14 15:03:40,944][63734] Sum rewards: 1.229, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.132', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'weapon5': '0.016', 'AMMO2': '0.025', 'AMMO4': '0.123', 'AMMO3': '0.134', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'HITCOUNT': '0.450', 'ARMOR': '0.517', 'WEAPON3': '0.700', 'weapon4': '0.738', 'weapon2': '1.072', 'DAMAGECOUNT': '1.452', 'weapon3': '1.614', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:03:41,160][63805] DAMAGECOUNT value on done: 14976.0 +[2023-09-14 15:03:41,328][63770] DAMAGECOUNT value on done: 11802.0 +[2023-09-14 15:03:41,329][63770] Sum rewards: 1.330, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.752', 'AMMO2': '0.001', 'AMMO4': '0.006', 'AMMO5': '0.025', 'WEAPON1': '0.060', 'WEAPON4': '0.100', 'AMMO3': '0.109', 'weapon5': '0.168', 'weapon4': '0.206', 'HITCOUNT': '0.350', 'WEAPON5': '0.400', 'WEAPON3': '0.750', 'weapon2': '1.090', 'DAMAGECOUNT': '1.545', 'FRAGCOUNT': '2.000', 'weapon3': '2.022'} +[2023-09-14 15:03:41,500][63805] DAMAGECOUNT value on done: 16060.0 +[2023-09-14 15:03:41,500][63805] Sum rewards: -1.635, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.048', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.026', 'weapon5': '0.028', 'ARMOR': '0.096', 'HITCOUNT': '0.110', 'AMMO4': '0.129', 'AMMO3': '0.141', 'WEAPON5': '0.150', 'weapon4': '0.276', 'DAMAGECOUNT': '0.291', 'WEAPON4': '0.300', 'WEAPON3': '0.700', 'weapon3': '1.334', 'weapon2': '1.814', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:03:41,715][63770] DAMAGECOUNT value on done: 14034.0 +[2023-09-14 15:03:41,716][63770] Sum rewards: -5.341, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.576', 'AMMO5': '0.007', 'AMMO2': '0.015', 'AMMO4': '0.073', 'weapon7': '0.094', 'ARMOR': '0.099', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.114', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.150', 'weapon5': '0.182', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.429', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.516', 'weapon3': '1.716'} +[2023-09-14 15:03:42,511][63769] DAMAGECOUNT value on done: 14059.0 +[2023-09-14 15:03:42,511][63769] Sum rewards: -2.140, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.762', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.022', 'AMMO3': '0.060', 'weapon7': '0.060', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon5': '0.108', 'AMMO4': '0.110', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'WEAPON3': '0.400', 'weapon4': '0.414', 'DAMAGECOUNT': '0.540', 'FRAGCOUNT': '1.000', 'weapon3': '1.246', 'weapon2': '1.284'} +[2023-09-14 15:03:42,812][63733] Updated weights for policy 1, policy_version 2300 (0.0013) +[2023-09-14 15:03:42,903][63806] DAMAGECOUNT value on done: 12804.0 +[2023-09-14 15:03:42,907][63769] DAMAGECOUNT value on done: 12365.0 +[2023-09-14 15:03:42,908][63769] Sum rewards: 0.406, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO5': '0.007', 'AMMO2': '0.017', 'WEAPON1': '0.030', 'AMMO4': '0.085', 'AMMO3': '0.090', 'WEAPON5': '0.150', 'HITCOUNT': '0.200', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.570', 'weapon5': '0.620', 'HEALTH': '0.842', 'weapon3': '1.250', 'weapon2': '1.644', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:43,213][63806] DAMAGECOUNT value on done: 13337.0 +[2023-09-14 15:03:43,213][63806] Sum rewards: -1.398, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.290', 'AMMO2': '0.014', 'AMMO5': '0.015', 'WEAPON1': '0.070', 'AMMO4': '0.071', 'WEAPON4': '0.100', 'AMMO3': '0.112', 'weapon4': '0.176', 'HITCOUNT': '0.190', 'WEAPON5': '0.300', 'weapon5': '0.362', 'DAMAGECOUNT': '0.690', 'WEAPON3': '0.700', 'weapon2': '1.422', 'weapon3': '1.670', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:03:43,485][63769] DAMAGECOUNT value on done: 15277.0 +[2023-09-14 15:03:43,485][63769] Sum rewards: -0.971, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.860', 'AMMO5': '0.010', 'AMMO2': '0.022', 'WEAPON1': '0.030', 'weapon5': '0.056', 'weapon7': '0.068', 'ARMOR': '0.080', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'AMMO4': '0.109', 'AMMO3': '0.136', 'HITCOUNT': '0.240', 'WEAPON4': '0.250', 'weapon4': '0.268', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.050', 'weapon3': '1.376', 'weapon2': '1.394', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:03:43,814][63769] DAMAGECOUNT value on done: 11053.0 +[2023-09-14 15:03:43,815][63769] Sum rewards: -2.982, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.400', 'AMMO5': '0.007', 'AMMO2': '0.021', 'WEAPON1': '0.030', 'ARMOR': '0.032', 'weapon5': '0.038', 'AMMO4': '0.107', 'AMMO3': '0.146', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'HITCOUNT': '0.210', 'weapon4': '0.334', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.891', 'weapon2': '1.580', 'weapon3': '1.622'} +[2023-09-14 15:03:45,928][63735] DAMAGECOUNT value on done: 14389.0 +[2023-09-14 15:03:45,929][63735] Sum rewards: -2.712, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.347', 'AMMO4': '-0.060', 'AMMO2': '-0.012', 'ARMOR': '0.008', 'AMMO5': '0.010', 'WEAPON1': '0.050', 'AMMO3': '0.079', 'HITCOUNT': '0.160', 'WEAPON5': '0.250', 'weapon5': '0.272', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.723', 'FRAGCOUNT': '1.000', 'weapon3': '1.418', 'weapon2': '1.636'} +[2023-09-14 15:03:46,292][63735] DAMAGECOUNT value on done: 10613.0 +[2023-09-14 15:03:46,293][63735] Sum rewards: -0.941, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.674', 'AMMO5': '0.005', 'weapon5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.012', 'weapon4': '0.024', 'WEAPON5': '0.050', 'AMMO4': '0.059', 'AMMO3': '0.146', 'WEAPON4': '0.150', 'HITCOUNT': '0.270', 'ARMOR': '0.532', 'WEAPON3': '0.900', 'weapon2': '0.926', 'DAMAGECOUNT': '1.005', 'FRAGCOUNT': '2.000', 'weapon3': '2.634'} +[2023-09-14 15:03:47,920][63732] Updated weights for policy 0, policy_version 2160 (0.0010) +[2023-09-14 15:03:48,502][63806] DAMAGECOUNT value on done: 12730.0 +[2023-09-14 15:03:48,604][63767] DAMAGECOUNT value on done: 15307.0 +[2023-09-14 15:03:48,604][63767] Sum rewards: 1.038, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.736', 'AMMO5': '0.015', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'AMMO4': '0.091', 'weapon7': '0.098', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.128', 'weapon5': '0.174', 'weapon4': '0.194', 'HITCOUNT': '0.200', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'WEAPON5': '0.300', 'WEAPON3': '0.650', 'weapon2': '1.116', 'DAMAGECOUNT': '1.257', 'weapon3': '1.598', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:48,656][63733] Updated weights for policy 1, policy_version 2310 (0.0010) +[2023-09-14 15:03:48,943][63806] DAMAGECOUNT value on done: 13442.0 +[2023-09-14 15:03:48,943][63806] Sum rewards: -1.920, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.370', 'weapon4': '0.002', 'AMMO5': '0.016', 'AMMO2': '0.021', 'WEAPON1': '0.040', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'AMMO4': '0.103', 'HITCOUNT': '0.170', 'AMMO3': '0.181', 'weapon5': '0.206', 'WEAPON5': '0.350', 'weapon2': '0.790', 'WEAPON3': '0.950', 'DAMAGECOUNT': '0.972', 'FRAGCOUNT': '2.000', 'weapon3': '2.308'} +[2023-09-14 15:03:48,983][63767] DAMAGECOUNT value on done: 14839.0 +[2023-09-14 15:03:48,984][63767] Sum rewards: -1.442, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.958', 'AMMO5': '0.005', 'AMMO2': '0.014', 'weapon5': '0.020', 'ARMOR': '0.036', 'weapon7': '0.062', 'AMMO4': '0.069', 'WEAPON5': '0.100', 'AMMO3': '0.113', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.150', 'weapon4': '0.160', 'WEAPON7': '0.200', 'HITCOUNT': '0.250', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.305', 'weapon2': '1.510', 'weapon3': '1.682', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:51,428][63735] DAMAGECOUNT value on done: 11978.0 +[2023-09-14 15:03:51,905][63735] DAMAGECOUNT value on done: 16262.0 +[2023-09-14 15:03:51,906][63735] Sum rewards: -4.967, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.383', 'AMMO5': '0.013', 'AMMO2': '0.029', 'WEAPON1': '0.030', 'ARMOR': '0.044', 'weapon5': '0.072', 'AMMO4': '0.144', 'AMMO3': '0.176', 'HITCOUNT': '0.210', 'WEAPON5': '0.250', 'weapon4': '0.262', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.645', 'WEAPON3': '1.100', 'weapon2': '1.456', 'weapon3': '1.686', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:03:52,490][63805] DAMAGECOUNT value on done: 14330.0 +[2023-09-14 15:03:52,491][63805] Sum rewards: 0.288, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.468', 'AMMO4': '-0.006', 'AMMO2': '-0.001', 'AMMO5': '0.013', 'WEAPON1': '0.030', 'ARMOR': '0.070', 'AMMO3': '0.101', 'HITCOUNT': '0.140', 'WEAPON5': '0.250', 'weapon5': '0.512', 'DAMAGECOUNT': '0.600', 'WEAPON3': '0.650', 'weapon3': '1.292', 'weapon2': '1.606', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:03:52,883][63805] DAMAGECOUNT value on done: 12312.0 +[2023-09-14 15:03:52,883][63805] Sum rewards: -2.499, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.606', 'AMMO5': '0.015', 'AMMO2': '0.017', 'weapon5': '0.040', 'WEAPON1': '0.050', 'ARMOR': '0.077', 'AMMO4': '0.084', 'WEAPON4': '0.100', 'AMMO3': '0.129', 'weapon4': '0.142', 'WEAPON5': '0.250', 'HITCOUNT': '0.330', 'WEAPON3': '0.900', 'weapon2': '1.034', 'DAMAGECOUNT': '1.137', 'FRAGCOUNT': '2.000', 'weapon3': '2.302'} +[2023-09-14 15:03:54,416][63771] DAMAGECOUNT value on done: 13933.0 +[2023-09-14 15:03:54,417][63771] Sum rewards: -3.809, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.435', 'WEAPON1': '0.010', 'weapon5': '0.014', 'AMMO5': '0.018', 'AMMO2': '0.029', 'ARMOR': '0.116', 'AMMO4': '0.142', 'AMMO3': '0.161', 'WEAPON4': '0.200', 'HITCOUNT': '0.220', 'WEAPON5': '0.350', 'weapon4': '0.414', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.831', 'weapon2': '1.104', 'weapon3': '1.818', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:54,488][63733] Updated weights for policy 1, policy_version 2320 (0.0012) +[2023-09-14 15:03:54,845][63771] DAMAGECOUNT value on done: 10804.0 +[2023-09-14 15:03:54,845][63771] Sum rewards: 2.787, reward structure: {'DEATHCOUNT': '-4.500', 'ARMOR': '0.004', 'AMMO5': '0.005', 'AMMO2': '0.007', 'weapon5': '0.022', 'AMMO4': '0.032', 'WEAPON1': '0.050', 'AMMO3': '0.057', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'weapon7': '0.134', 'HITCOUNT': '0.230', 'WEAPON3': '0.300', 'HEALTH': '0.426', 'weapon3': '0.928', 'DAMAGECOUNT': '1.020', 'weapon2': '1.672', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:03:55,271][63734] DAMAGECOUNT value on done: 13214.0 +[2023-09-14 15:03:55,271][63734] Sum rewards: -2.472, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.582', 'AMMO2': '0.000', 'AMMO4': '0.001', 'AMMO5': '0.024', 'WEAPON1': '0.080', 'AMMO3': '0.121', 'HITCOUNT': '0.150', 'weapon5': '0.384', 'WEAPON5': '0.500', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.702', 'weapon2': '1.334', 'weapon3': '1.914'} +[2023-09-14 15:03:55,655][63734] DAMAGECOUNT value on done: 12999.0 +[2023-09-14 15:03:57,570][63732] Updated weights for policy 0, policy_version 2170 (0.0011) +[2023-09-14 15:03:59,806][63770] DAMAGECOUNT value on done: 15287.0 +[2023-09-14 15:03:59,806][63770] Sum rewards: 1.020, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.902', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'AMMO5': '0.005', 'WEAPON1': '0.060', 'AMMO3': '0.074', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.132', 'HITCOUNT': '0.190', 'ARMOR': '0.468', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.780', 'FRAGCOUNT': '1.000', 'weapon2': '1.326', 'weapon3': '1.688'} +[2023-09-14 15:03:59,984][63767] DAMAGECOUNT value on done: 15609.0 +[2023-09-14 15:03:59,984][63767] Sum rewards: -0.408, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.997', 'AMMO2': '0.009', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.047', 'WEAPON4': '0.050', 'weapon7': '0.076', 'ARMOR': '0.080', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.135', 'weapon4': '0.162', 'weapon5': '0.216', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.753', 'WEAPON3': '0.800', 'weapon2': '1.170', 'weapon3': '1.746', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:04:00,144][63770] DAMAGECOUNT value on done: 12360.0 +[2023-09-14 15:04:00,144][63770] Sum rewards: -1.718, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.667', 'AMMO5': '0.020', 'WEAPON1': '0.030', 'AMMO2': '0.037', 'ARMOR': '0.060', 'weapon5': '0.080', 'weapon4': '0.116', 'AMMO3': '0.143', 'WEAPON4': '0.150', 'AMMO4': '0.183', 'HITCOUNT': '0.250', 'WEAPON5': '0.350', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.930', 'FRAGCOUNT': '1.500', 'weapon2': '1.564', 'weapon3': '1.786'} +[2023-09-14 15:04:00,293][63733] Updated weights for policy 1, policy_version 2330 (0.0011) +[2023-09-14 15:04:00,416][63767] DAMAGECOUNT value on done: 18102.0 +[2023-09-14 15:04:00,416][63767] Sum rewards: 1.626, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.525', 'AMMO5': '0.033', 'AMMO2': '0.037', 'AMMO3': '0.083', 'WEAPON1': '0.090', 'HITCOUNT': '0.170', 'AMMO4': '0.182', 'ARMOR': '0.458', 'WEAPON5': '0.600', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.840', 'weapon2': '0.946', 'weapon5': '1.112', 'weapon3': '1.650', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:02,342][63771] DAMAGECOUNT value on done: 12496.0 +[2023-09-14 15:04:02,342][63771] Sum rewards: 2.868, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.523', 'weapon4': '0.006', 'AMMO5': '0.015', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'AMMO4': '0.089', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON4': '0.100', 'WEAPON7': '0.100', 'weapon7': '0.104', 'ARMOR': '0.108', 'AMMO3': '0.109', 'weapon5': '0.116', 'WEAPON5': '0.250', 'HITCOUNT': '0.420', 'WEAPON3': '0.700', 'weapon2': '1.454', 'DAMAGECOUNT': '1.650', 'weapon3': '1.932', 'FRAGCOUNT': '3.500'} +[2023-09-14 15:04:02,738][63771] DAMAGECOUNT value on done: 15080.0 +[2023-09-14 15:04:02,739][63771] Sum rewards: -0.314, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.472', 'AMMO4': '-0.023', 'AMMO2': '-0.005', 'AMMO5': '0.013', 'WEAPON1': '0.050', 'ARMOR': '0.080', 'AMMO3': '0.119', 'weapon5': '0.166', 'HITCOUNT': '0.180', 'WEAPON5': '0.250', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.840', 'weapon2': '1.508', 'weapon3': '1.680', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:03,361][63734] DAMAGECOUNT value on done: 16037.0 +[2023-09-14 15:04:03,362][63734] Sum rewards: -2.596, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.948', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.026', 'weapon5': '0.046', 'ARMOR': '0.064', 'weapon7': '0.082', 'WEAPON5': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO4': '0.130', 'AMMO3': '0.131', 'WEAPON7': '0.200', 'WEAPON4': '0.250', 'HITCOUNT': '0.330', 'weapon4': '0.404', 'WEAPON3': '0.600', 'weapon2': '1.002', 'DAMAGECOUNT': '1.230', 'FRAGCOUNT': '1.500', 'weapon3': '1.752'} +[2023-09-14 15:04:03,701][63734] DAMAGECOUNT value on done: 13897.0 +[2023-09-14 15:04:03,701][63734] Sum rewards: -0.237, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.130', 'AMMO2': '0.003', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'ARMOR': '0.012', 'AMMO4': '0.013', 'WEAPON4': '0.050', 'weapon4': '0.050', 'weapon5': '0.072', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.142', 'WEAPON5': '0.250', 'HITCOUNT': '0.350', 'WEAPON3': '0.850', 'weapon2': '1.314', 'DAMAGECOUNT': '1.344', 'weapon3': '1.872', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:04:04,517][63805] DAMAGECOUNT value on done: 15090.0 +[2023-09-14 15:04:04,517][63805] Sum rewards: -2.298, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.478', 'AMMO2': '0.009', 'AMMO5': '0.012', 'WEAPON1': '0.040', 'AMMO4': '0.042', 'ARMOR': '0.056', 'weapon4': '0.104', 'HITCOUNT': '0.120', 'AMMO3': '0.137', 'WEAPON4': '0.150', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.342', 'WEAPON3': '0.800', 'weapon5': '0.934', 'FRAGCOUNT': '1.000', 'weapon3': '1.176', 'weapon2': '1.508'} +[2023-09-14 15:04:04,867][63805] DAMAGECOUNT value on done: 16191.0 +[2023-09-14 15:04:04,868][63805] Sum rewards: -0.981, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.071', 'AMMO4': '-0.027', 'AMMO2': '-0.005', 'AMMO5': '0.007', 'WEAPON1': '0.030', 'weapon7': '0.068', 'AMMO3': '0.079', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon5': '0.224', 'DAMAGECOUNT': '0.393', 'ARMOR': '0.507', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon3': '1.366', 'weapon2': '1.758'} +[2023-09-14 15:04:05,008][63770] DAMAGECOUNT value on done: 12122.0 +[2023-09-14 15:04:05,009][63770] Sum rewards: 0.811, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.718', 'AMMO5': '0.010', 'AMMO2': '0.023', 'ARMOR': '0.024', 'WEAPON4': '0.050', 'weapon4': '0.066', 'AMMO3': '0.073', 'WEAPON1': '0.100', 'AMMO4': '0.113', 'HITCOUNT': '0.140', 'weapon5': '0.208', 'WEAPON5': '0.250', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.960', 'weapon3': '1.470', 'weapon2': '1.492', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:04:05,354][63770] DAMAGECOUNT value on done: 14361.0 +[2023-09-14 15:04:05,355][63770] Sum rewards: -1.987, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.651', 'ARMOR': '0.004', 'weapon4': '0.008', 'AMMO5': '0.018', 'AMMO2': '0.022', 'WEAPON1': '0.070', 'WEAPON4': '0.100', 'AMMO4': '0.111', 'AMMO3': '0.134', 'HITCOUNT': '0.220', 'WEAPON5': '0.350', 'weapon5': '0.526', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.981', 'weapon2': '1.126', 'weapon3': '1.944', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:05,993][63769] DAMAGECOUNT value on done: 15742.0 +[2023-09-14 15:04:05,994][63769] Sum rewards: -0.540, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.540', 'AMMO2': '0.015', 'AMMO5': '0.019', 'WEAPON1': '0.020', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'AMMO4': '0.074', 'weapon4': '0.080', 'AMMO3': '0.111', 'HITCOUNT': '0.120', 'weapon5': '0.388', 'WEAPON5': '0.450', 'WEAPON3': '0.600', 'weapon2': '1.208', 'DAMAGECOUNT': '1.395', 'weapon3': '1.688', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:06,093][63733] Updated weights for policy 1, policy_version 2340 (0.0011) +[2023-09-14 15:04:06,354][63806] DAMAGECOUNT value on done: 13205.0 +[2023-09-14 15:04:06,355][63806] Sum rewards: 0.044, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.706', 'weapon4': '0.002', 'AMMO5': '0.007', 'AMMO2': '0.008', 'WEAPON1': '0.010', 'AMMO4': '0.037', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'AMMO3': '0.100', 'WEAPON5': '0.150', 'weapon5': '0.222', 'HITCOUNT': '0.340', 'WEAPON3': '0.550', 'DAMAGECOUNT': '1.203', 'weapon3': '1.324', 'weapon2': '1.956', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:06,363][63769] DAMAGECOUNT value on done: 11287.0 +[2023-09-14 15:04:06,364][63769] Sum rewards: -0.096, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.284', 'AMMO4': '-0.049', 'AMMO2': '-0.010', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'weapon7': '0.062', 'ARMOR': '0.068', 'AMMO3': '0.101', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon5': '0.140', 'WEAPON5': '0.150', 'WEAPON7': '0.200', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.702', 'WEAPON3': '0.750', 'weapon2': '1.468', 'weapon3': '1.880', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:04:06,729][63806] DAMAGECOUNT value on done: 13530.0 +[2023-09-14 15:04:06,729][63806] Sum rewards: 1.538, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO2': '0.022', 'AMMO5': '0.022', 'ARMOR': '0.040', 'weapon4': '0.040', 'WEAPON1': '0.060', 'AMMO3': '0.080', 'WEAPON4': '0.100', 'AMMO4': '0.109', 'HITCOUNT': '0.180', 'weapon5': '0.292', 'HEALTH': '0.314', 'WEAPON3': '0.450', 'WEAPON5': '0.450', 'DAMAGECOUNT': '0.579', 'weapon3': '1.452', 'weapon2': '1.848', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:07,081][63732] Updated weights for policy 0, policy_version 2180 (0.0011) +[2023-09-14 15:04:07,369][63769] DAMAGECOUNT value on done: 14594.0 +[2023-09-14 15:04:07,370][63769] Sum rewards: 0.477, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.410', 'AMMO4': '-0.003', 'AMMO2': '-0.001', 'AMMO3': '0.092', 'weapon7': '0.130', 'AMMO6': '0.220', 'AMMO7': '0.220', 'WEAPON7': '0.300', 'HITCOUNT': '0.310', 'ARMOR': '0.416', 'WEAPON3': '0.600', 'weapon3': '1.482', 'weapon2': '1.516', 'DAMAGECOUNT': '1.605', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:07,718][63769] DAMAGECOUNT value on done: 12758.0 +[2023-09-14 15:04:07,719][63769] Sum rewards: -2.666, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.596', 'AMMO2': '0.019', 'AMMO5': '0.027', 'ARMOR': '0.028', 'WEAPON1': '0.070', 'AMMO4': '0.094', 'WEAPON4': '0.100', 'weapon4': '0.112', 'AMMO3': '0.172', 'weapon5': '0.226', 'HITCOUNT': '0.340', 'WEAPON5': '0.400', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.179', 'weapon2': '1.618', 'weapon3': '1.646', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:04:09,229][63735] DAMAGECOUNT value on done: 14544.0 +[2023-09-14 15:04:09,230][63735] Sum rewards: -0.686, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.319', 'AMMO5': '0.005', 'AMMO2': '0.014', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'AMMO4': '0.070', 'AMMO3': '0.082', 'WEAPON5': '0.100', 'HITCOUNT': '0.130', 'weapon5': '0.184', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.500', 'ARMOR': '0.552', 'FRAGCOUNT': '1.000', 'weapon2': '1.182', 'weapon3': '1.278'} +[2023-09-14 15:04:09,597][63735] DAMAGECOUNT value on done: 11075.0 +[2023-09-14 15:04:09,597][63735] Sum rewards: 1.311, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.514', 'AMMO5': '0.010', 'AMMO2': '0.014', 'weapon4': '0.044', 'WEAPON1': '0.060', 'AMMO4': '0.069', 'ARMOR': '0.076', 'AMMO3': '0.130', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'weapon5': '0.200', 'HITCOUNT': '0.310', 'WEAPON3': '0.700', 'weapon2': '1.216', 'DAMAGECOUNT': '1.386', 'weapon3': '1.760', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:11,165][63767] DAMAGECOUNT value on done: 15496.0 +[2023-09-14 15:04:11,166][63767] Sum rewards: -0.082, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.453', 'AMMO4': '-0.010', 'AMMO2': '-0.002', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO3': '0.074', 'weapon5': '0.104', 'HITCOUNT': '0.150', 'WEAPON5': '0.200', 'ARMOR': '0.532', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.567', 'weapon3': '1.414', 'weapon2': '1.514', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:11,552][63767] DAMAGECOUNT value on done: 15318.0 +[2023-09-14 15:04:11,553][63767] Sum rewards: -1.420, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.508', 'AMMO2': '0.004', 'AMMO5': '0.012', 'AMMO4': '0.022', 'ARMOR': '0.040', 'AMMO3': '0.162', 'weapon5': '0.168', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.300', 'HITCOUNT': '0.310', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.437', 'weapon2': '1.508', 'weapon3': '1.924'} +[2023-09-14 15:04:11,949][63733] Updated weights for policy 1, policy_version 2350 (0.0010) +[2023-09-14 15:04:12,919][63806] DAMAGECOUNT value on done: 12969.0 +[2023-09-14 15:04:13,358][63806] DAMAGECOUNT value on done: 13887.0 +[2023-09-14 15:04:13,358][63806] Sum rewards: -0.571, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.423', 'weapon5': '0.006', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.025', 'ARMOR': '0.088', 'AMMO4': '0.125', 'AMMO3': '0.128', 'WEAPON5': '0.150', 'weapon4': '0.222', 'WEAPON4': '0.300', 'HITCOUNT': '0.430', 'WEAPON3': '0.750', 'weapon2': '0.896', 'DAMAGECOUNT': '1.335', 'weapon3': '2.126', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:15,787][63805] DAMAGECOUNT value on done: 14479.0 +[2023-09-14 15:04:15,788][63805] Sum rewards: -1.814, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.970', 'AMMO2': '0.007', 'AMMO5': '0.015', 'AMMO4': '0.035', 'ARMOR': '0.040', 'WEAPON1': '0.050', 'HITCOUNT': '0.140', 'AMMO3': '0.147', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.447', 'WEAPON3': '0.700', 'weapon5': '0.804', 'FRAGCOUNT': '1.000', 'weapon3': '1.340', 'weapon2': '1.630'} +[2023-09-14 15:04:16,154][63735] DAMAGECOUNT value on done: 12158.0 +[2023-09-14 15:04:16,154][63735] Sum rewards: -3.204, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.636', 'AMMO2': '0.015', 'AMMO5': '0.018', 'ARMOR': '0.044', 'WEAPON1': '0.050', 'AMMO4': '0.073', 'AMMO3': '0.128', 'WEAPON4': '0.150', 'weapon4': '0.162', 'HITCOUNT': '0.170', 'weapon5': '0.268', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.540', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.374', 'weapon3': '1.490'} +[2023-09-14 15:04:16,180][63805] DAMAGECOUNT value on done: 12645.0 +[2023-09-14 15:04:16,181][63805] Sum rewards: 1.103, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.782', 'AMMO2': '0.013', 'AMMO5': '0.018', 'ARMOR': '0.040', 'WEAPON1': '0.040', 'AMMO4': '0.063', 'AMMO3': '0.124', 'WEAPON4': '0.150', 'weapon4': '0.164', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'weapon5': '0.416', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.999', 'weapon3': '1.268', 'weapon2': '1.820', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:16,475][63735] DAMAGECOUNT value on done: 16613.0 +[2023-09-14 15:04:16,475][63735] Sum rewards: 0.238, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.480', 'AMMO5': '0.003', 'AMMO2': '0.003', 'weapon5': '0.014', 'AMMO4': '0.016', 'WEAPON4': '0.050', 'WEAPON5': '0.050', 'ARMOR': '0.080', 'weapon4': '0.118', 'AMMO3': '0.123', 'HITCOUNT': '0.250', 'WEAPON3': '0.500', 'DAMAGECOUNT': '1.053', 'weapon2': '1.372', 'weapon3': '1.586', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:16,826][63732] Updated weights for policy 0, policy_version 2190 (0.0010) +[2023-09-14 15:04:17,851][63733] Updated weights for policy 1, policy_version 2360 (0.0011) +[2023-09-14 15:04:19,257][63734] DAMAGECOUNT value on done: 13454.0 +[2023-09-14 15:04:19,258][63734] Sum rewards: -3.160, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.588', 'AMMO2': '0.008', 'AMMO5': '0.023', 'AMMO4': '0.038', 'ARMOR': '0.040', 'weapon5': '0.068', 'WEAPON1': '0.070', 'AMMO3': '0.158', 'HITCOUNT': '0.190', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.720', 'WEAPON3': '0.950', 'weapon2': '1.606', 'weapon3': '1.958', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:04:19,658][63734] DAMAGECOUNT value on done: 13169.0 +[2023-09-14 15:04:19,659][63734] Sum rewards: -6.870, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.755', 'AMMO2': '0.012', 'AMMO5': '0.025', 'ARMOR': '0.036', 'WEAPON1': '0.040', 'AMMO4': '0.061', 'AMMO3': '0.115', 'weapon4': '0.116', 'weapon5': '0.136', 'HITCOUNT': '0.190', 'WEAPON4': '0.200', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.510', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.612', 'weapon2': '1.782'} +[2023-09-14 15:04:19,681][63771] DAMAGECOUNT value on done: 14355.0 +[2023-09-14 15:04:19,681][63771] Sum rewards: -2.159, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.631', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'AMMO5': '0.010', 'ARMOR': '0.068', 'weapon5': '0.128', 'AMMO3': '0.164', 'WEAPON5': '0.200', 'HITCOUNT': '0.280', 'WEAPON3': '1.100', 'weapon2': '1.204', 'DAMAGECOUNT': '1.266', 'FRAGCOUNT': '2.000', 'weapon3': '2.332'} +[2023-09-14 15:04:20,073][63771] DAMAGECOUNT value on done: 11094.0 +[2023-09-14 15:04:20,074][63771] Sum rewards: -5.165, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.074', 'AMMO5': '0.018', 'AMMO2': '0.019', 'ARMOR': '0.044', 'WEAPON4': '0.050', 'WEAPON1': '0.070', 'AMMO4': '0.096', 'weapon5': '0.104', 'AMMO3': '0.132', 'HITCOUNT': '0.220', 'WEAPON5': '0.250', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.870', 'weapon2': '1.390', 'FRAGCOUNT': '2.000', 'weapon3': '2.046'} +[2023-09-14 15:04:23,795][63733] Updated weights for policy 1, policy_version 2370 (0.0010) +[2023-09-14 15:04:25,109][63767] DAMAGECOUNT value on done: 15731.0 +[2023-09-14 15:04:25,109][63767] Sum rewards: -4.570, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'AMMO5': '0.015', 'ARMOR': '0.028', 'AMMO2': '0.033', 'WEAPON1': '0.050', 'WEAPON4': '0.100', 'AMMO3': '0.106', 'HITCOUNT': '0.130', 'HEALTH': '0.140', 'AMMO4': '0.166', 'weapon5': '0.170', 'WEAPON5': '0.250', 'weapon4': '0.336', 'DAMAGECOUNT': '0.366', 'WEAPON3': '0.500', 'weapon2': '1.032', 'weapon3': '1.758'} +[2023-09-14 15:04:25,229][63770] DAMAGECOUNT value on done: 15584.0 +[2023-09-14 15:04:25,230][63770] Sum rewards: 0.533, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.602', 'AMMO5': '0.020', 'AMMO2': '0.023', 'weapon4': '0.070', 'AMMO3': '0.084', 'WEAPON1': '0.110', 'AMMO4': '0.116', 'HITCOUNT': '0.150', 'WEAPON4': '0.150', 'weapon5': '0.236', 'WEAPON5': '0.450', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.891', 'weapon2': '1.214', 'weapon3': '1.570', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:25,520][63767] DAMAGECOUNT value on done: 18207.0 +[2023-09-14 15:04:25,667][63770] DAMAGECOUNT value on done: 12825.0 +[2023-09-14 15:04:25,668][63770] Sum rewards: 1.169, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.185', 'AMMO2': '0.010', 'AMMO5': '0.012', 'WEAPON1': '0.020', 'AMMO4': '0.048', 'ARMOR': '0.052', 'weapon7': '0.062', 'weapon5': '0.082', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.133', 'WEAPON5': '0.200', 'HITCOUNT': '0.320', 'WEAPON3': '0.800', 'weapon2': '1.380', 'DAMAGECOUNT': '1.395', 'weapon3': '1.790', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:04:26,341][63734] DAMAGECOUNT value on done: 16323.0 +[2023-09-14 15:04:26,341][63734] Sum rewards: -4.945, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.580', 'AMMO2': '0.002', 'AMMO4': '0.012', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'ARMOR': '0.028', 'AMMO3': '0.189', 'HITCOUNT': '0.190', 'weapon5': '0.192', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.858', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.192', 'weapon3': '1.934'} +[2023-09-14 15:04:26,433][63771] DAMAGECOUNT value on done: 12561.0 +[2023-09-14 15:04:26,434][63771] Sum rewards: -2.188, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.244', 'AMMO5': '0.007', 'AMMO2': '0.018', 'WEAPON1': '0.050', 'HITCOUNT': '0.060', 'ARMOR': '0.080', 'AMMO4': '0.091', 'AMMO3': '0.100', 'weapon4': '0.132', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.195', 'WEAPON5': '0.200', 'weapon5': '0.214', 'WEAPON3': '0.550', 'weapon3': '0.940', 'FRAGCOUNT': '1.000', 'weapon2': '1.768'} +[2023-09-14 15:04:26,481][63732] Updated weights for policy 0, policy_version 2200 (0.0011) +[2023-09-14 15:04:26,722][63734] DAMAGECOUNT value on done: 14090.0 +[2023-09-14 15:04:26,723][63734] Sum rewards: -2.174, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.515', 'AMMO2': '0.002', 'AMMO4': '0.010', 'AMMO5': '0.023', 'WEAPON1': '0.040', 'weapon5': '0.068', 'AMMO3': '0.091', 'weapon4': '0.092', 'WEAPON4': '0.100', 'ARMOR': '0.128', 'HITCOUNT': '0.190', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.579', 'WEAPON3': '0.700', 'weapon3': '1.556', 'weapon2': '1.612', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:26,838][63771] DAMAGECOUNT value on done: 15510.0 +[2023-09-14 15:04:26,838][63771] Sum rewards: 0.402, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.149', 'AMMO4': '-0.002', 'AMMO2': '-0.000', 'WEAPON1': '0.010', 'AMMO5': '0.010', 'weapon4': '0.028', 'WEAPON4': '0.050', 'ARMOR': '0.064', 'AMMO3': '0.117', 'WEAPON5': '0.200', 'HITCOUNT': '0.300', 'weapon5': '0.392', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.290', 'weapon2': '1.600', 'weapon3': '1.742', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:04:27,467][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002201_9015296.pth... +[2023-09-14 15:04:27,467][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000002376_9732096.pth... +[2023-09-14 15:04:27,518][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000001995_8171520.pth +[2023-09-14 15:04:27,528][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000001924_7880704.pth +[2023-09-14 15:04:27,535][63576] Saving new best policy, reward=-2.069! +[2023-09-14 15:04:27,720][63805] DAMAGECOUNT value on done: 15265.0 +[2023-09-14 15:04:27,721][63805] Sum rewards: -0.284, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.897', 'AMMO5': '0.010', 'AMMO2': '0.012', 'weapon5': '0.032', 'WEAPON1': '0.040', 'AMMO4': '0.057', 'AMMO3': '0.100', 'WEAPON5': '0.100', 'WEAPON4': '0.150', 'HITCOUNT': '0.170', 'weapon4': '0.264', 'DAMAGECOUNT': '0.525', 'ARMOR': '0.545', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon2': '1.514', 'weapon3': '1.544'} +[2023-09-14 15:04:28,136][63805] DAMAGECOUNT value on done: 16411.0 +[2023-09-14 15:04:28,136][63805] Sum rewards: -1.987, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.850', 'AMMO4': '-0.034', 'AMMO2': '-0.007', 'AMMO5': '0.012', 'WEAPON1': '0.060', 'ARMOR': '0.069', 'AMMO3': '0.086', 'HITCOUNT': '0.180', 'WEAPON5': '0.300', 'weapon5': '0.542', 'DAMAGECOUNT': '0.660', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.312', 'weapon3': '1.682'} +[2023-09-14 15:04:28,703][63769] DAMAGECOUNT value on done: 16272.0 +[2023-09-14 15:04:28,704][63769] Sum rewards: -1.062, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.628', 'WEAPON1': '0.010', 'AMMO2': '0.015', 'AMMO5': '0.025', 'weapon4': '0.056', 'AMMO4': '0.075', 'WEAPON4': '0.100', 'AMMO3': '0.164', 'weapon5': '0.216', 'WEAPON5': '0.350', 'HITCOUNT': '0.380', 'WEAPON3': '0.900', 'weapon3': '1.502', 'DAMAGECOUNT': '1.590', 'weapon2': '1.682', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:04:29,030][63769] DAMAGECOUNT value on done: 11504.0 +[2023-09-14 15:04:29,031][63769] Sum rewards: -7.361, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.642', 'AMMO5': '0.003', 'weapon5': '0.008', 'WEAPON1': '0.010', 'AMMO2': '0.015', 'WEAPON5': '0.050', 'weapon4': '0.070', 'AMMO4': '0.074', 'ARMOR': '0.096', 'WEAPON4': '0.150', 'HITCOUNT': '0.180', 'AMMO3': '0.193', 'DAMAGECOUNT': '0.651', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050', 'weapon2': '1.130', 'weapon3': '2.352'} +[2023-09-14 15:04:29,247][63770] DAMAGECOUNT value on done: 13057.0 +[2023-09-14 15:04:29,248][63770] Sum rewards: 1.445, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.726', 'AMMO2': '0.001', 'AMMO4': '0.005', 'weapon5': '0.012', 'AMMO5': '0.023', 'WEAPON1': '0.040', 'ARMOR': '0.052', 'weapon7': '0.076', 'AMMO3': '0.079', 'weapon4': '0.142', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'HITCOUNT': '0.240', 'WEAPON5': '0.350', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.305', 'weapon3': '1.584', 'weapon2': '1.692', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:29,564][63733] Updated weights for policy 1, policy_version 2380 (0.0011) +[2023-09-14 15:04:29,632][63770] DAMAGECOUNT value on done: 14491.0 +[2023-09-14 15:04:29,696][63806] DAMAGECOUNT value on done: 13467.0 +[2023-09-14 15:04:30,020][63806] DAMAGECOUNT value on done: 13768.0 +[2023-09-14 15:04:30,021][63806] Sum rewards: 2.124, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.768', 'AMMO2': '0.003', 'AMMO5': '0.010', 'AMMO4': '0.013', 'weapon5': '0.018', 'WEAPON1': '0.050', 'WEAPON4': '0.050', 'AMMO3': '0.098', 'weapon4': '0.124', 'ARMOR': '0.140', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.714', 'weapon3': '1.494', 'weapon2': '1.818', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:04:32,462][63576] Saving new best policy, reward=-1.868! +[2023-09-14 15:04:32,469][63769] DAMAGECOUNT value on done: 14821.0 +[2023-09-14 15:04:32,469][63769] Sum rewards: 2.910, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.094', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.012', 'ARMOR': '0.015', 'WEAPON5': '0.050', 'AMMO4': '0.058', 'AMMO3': '0.090', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon7': '0.112', 'weapon5': '0.138', 'WEAPON4': '0.150', 'HITCOUNT': '0.200', 'weapon4': '0.362', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.681', 'weapon2': '1.022', 'weapon3': '1.552', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:32,714][63735] DAMAGECOUNT value on done: 14809.0 +[2023-09-14 15:04:32,715][63735] Sum rewards: 1.488, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.455', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'AMMO5': '0.020', 'ARMOR': '0.028', 'WEAPON1': '0.040', 'AMMO3': '0.050', 'WEAPON4': '0.050', 'weapon5': '0.080', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon7': '0.126', 'weapon4': '0.138', 'HITCOUNT': '0.210', 'WEAPON5': '0.300', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.795', 'FRAGCOUNT': '1.000', 'weapon3': '1.142', 'weapon2': '1.774'} +[2023-09-14 15:04:32,865][63769] DAMAGECOUNT value on done: 12773.0 +[2023-09-14 15:04:32,866][63769] Sum rewards: 1.685, reward structure: {'DEATHCOUNT': '-1.500', 'HEALTH': '-0.625', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.005', 'HITCOUNT': '0.010', 'WEAPON1': '0.020', 'AMMO3': '0.036', 'DAMAGECOUNT': '0.045', 'WEAPON5': '0.100', 'WEAPON3': '0.200', 'weapon5': '0.490', 'ARMOR': '0.500', 'weapon3': '0.610', 'weapon2': '0.790', 'FRAGCOUNT': '1.000'} +[2023-09-14 15:04:33,104][63735] DAMAGECOUNT value on done: 11270.0 +[2023-09-14 15:04:33,105][63735] Sum rewards: -2.911, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.515', 'AMMO2': '0.016', 'AMMO5': '0.023', 'weapon4': '0.042', 'AMMO4': '0.077', 'WEAPON1': '0.090', 'WEAPON4': '0.100', 'AMMO3': '0.111', 'HITCOUNT': '0.130', 'weapon5': '0.350', 'WEAPON5': '0.450', 'DAMAGECOUNT': '0.585', 'WEAPON3': '0.750', 'weapon3': '1.530', 'weapon2': '1.600', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:04:33,523][63767] DAMAGECOUNT value on done: 15573.0 +[2023-09-14 15:04:33,906][63767] DAMAGECOUNT value on done: 15613.0 +[2023-09-14 15:04:33,906][63767] Sum rewards: -5.814, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-1.706', 'weapon5': '0.006', 'AMMO2': '0.006', 'AMMO5': '0.015', 'AMMO4': '0.030', 'ARMOR': '0.032', 'WEAPON4': '0.150', 'weapon4': '0.164', 'HITCOUNT': '0.190', 'AMMO3': '0.246', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.885', 'WEAPON3': '1.100', 'weapon2': '1.542', 'weapon3': '1.976', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:04:35,190][63733] Updated weights for policy 1, policy_version 2390 (0.0011) +[2023-09-14 15:04:37,032][63732] Updated weights for policy 0, policy_version 2210 (0.0010) +[2023-09-14 15:04:37,466][63576] Saving new best policy, reward=-1.802! +[2023-09-14 15:04:37,689][63806] DAMAGECOUNT value on done: 13149.0 +[2023-09-14 15:04:37,689][63806] Sum rewards: -0.350, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.612', 'AMMO5': '0.012', 'AMMO2': '0.027', 'WEAPON1': '0.040', 'AMMO3': '0.048', 'ARMOR': '0.098', 'HITCOUNT': '0.120', 'AMMO4': '0.136', 'weapon4': '0.202', 'WEAPON5': '0.250', 'WEAPON4': '0.250', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.540', 'weapon3': '0.864', 'weapon5': '0.896', 'FRAGCOUNT': '1.000', 'weapon2': '1.478'} +[2023-09-14 15:04:38,038][63806] DAMAGECOUNT value on done: 14037.0 +[2023-09-14 15:04:39,036][63805] DAMAGECOUNT value on done: 14692.0 +[2023-09-14 15:04:39,037][63805] Sum rewards: -0.648, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.826', 'AMMO5': '0.020', 'ARMOR': '0.024', 'AMMO2': '0.030', 'AMMO3': '0.085', 'WEAPON1': '0.090', 'WEAPON4': '0.100', 'weapon4': '0.102', 'AMMO4': '0.150', 'HITCOUNT': '0.160', 'WEAPON3': '0.350', 'weapon5': '0.386', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.639', 'weapon3': '0.928', 'FRAGCOUNT': '1.000', 'weapon2': '1.714'} +[2023-09-14 15:04:39,424][63805] DAMAGECOUNT value on done: 13085.0 +[2023-09-14 15:04:39,425][63805] Sum rewards: -2.130, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.103', 'AMMO2': '0.008', 'weapon5': '0.020', 'AMMO5': '0.022', 'ARMOR': '0.032', 'AMMO4': '0.042', 'WEAPON1': '0.070', 'weapon4': '0.074', 'WEAPON4': '0.100', 'AMMO3': '0.170', 'HITCOUNT': '0.250', 'WEAPON5': '0.450', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.320', 'weapon2': '1.686', 'weapon3': '1.828', 'FRAGCOUNT': '5.000'} +[2023-09-14 15:04:40,850][63733] Updated weights for policy 1, policy_version 2400 (0.0010) +[2023-09-14 15:04:40,873][63735] DAMAGECOUNT value on done: 12307.0 +[2023-09-14 15:04:40,874][63735] Sum rewards: -5.679, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.716', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.002', 'AMMO4': '0.010', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'ARMOR': '0.035', 'AMMO3': '0.147', 'HITCOUNT': '0.150', 'weapon5': '0.168', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.447', 'WEAPON3': '0.650', 'weapon2': '1.508', 'weapon3': '1.950'} +[2023-09-14 15:04:41,273][63735] DAMAGECOUNT value on done: 16892.0 +[2023-09-14 15:04:41,274][63735] Sum rewards: 2.543, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.514', 'AMMO5': '0.007', 'AMMO2': '0.015', 'WEAPON1': '0.040', 'AMMO4': '0.072', 'AMMO3': '0.087', 'weapon4': '0.088', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'weapon5': '0.178', 'HITCOUNT': '0.280', 'ARMOR': '0.570', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.837', 'weapon2': '1.486', 'weapon3': '1.796', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:04:42,462][63576] Saving new best policy, reward=-1.700! +[2023-09-14 15:04:43,158][63734] DAMAGECOUNT value on done: 13609.0 +[2023-09-14 15:04:43,159][63734] Sum rewards: -0.798, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.128', 'AMMO2': '0.011', 'AMMO5': '0.020', 'WEAPON1': '0.020', 'weapon4': '0.028', 'AMMO4': '0.055', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'AMMO3': '0.102', 'ARMOR': '0.125', 'weapon5': '0.160', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon3': '1.470', 'weapon2': '1.674'} +[2023-09-14 15:04:43,548][63734] DAMAGECOUNT value on done: 13527.0 +[2023-09-14 15:04:43,549][63734] Sum rewards: -1.336, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.766', 'AMMO2': '0.013', 'AMMO5': '0.018', 'weapon4': '0.020', 'ARMOR': '0.040', 'AMMO4': '0.063', 'WEAPON1': '0.090', 'WEAPON4': '0.150', 'AMMO3': '0.159', 'WEAPON5': '0.250', 'HITCOUNT': '0.260', 'weapon5': '0.464', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.074', 'weapon2': '1.178', 'weapon3': '1.802', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:44,977][63771] DAMAGECOUNT value on done: 14470.0 +[2023-09-14 15:04:45,361][63771] DAMAGECOUNT value on done: 11274.0 +[2023-09-14 15:04:46,760][63733] Updated weights for policy 1, policy_version 2410 (0.0010) +[2023-09-14 15:04:47,159][63732] Updated weights for policy 0, policy_version 2220 (0.0011) +[2023-09-14 15:04:47,466][63576] Saving new best policy, reward=-1.695! +[2023-09-14 15:04:50,013][63767] DAMAGECOUNT value on done: 15914.0 +[2023-09-14 15:04:50,014][63767] Sum rewards: -2.821, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.720', 'AMMO5': '0.007', 'AMMO2': '0.012', 'WEAPON1': '0.020', 'weapon5': '0.046', 'WEAPON4': '0.050', 'AMMO4': '0.059', 'HITCOUNT': '0.140', 'weapon4': '0.140', 'AMMO3': '0.177', 'WEAPON5': '0.200', 'ARMOR': '0.472', 'DAMAGECOUNT': '0.549', 'WEAPON3': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.434', 'weapon3': '1.692'} +[2023-09-14 15:04:50,446][63767] DAMAGECOUNT value on done: 18452.0 +[2023-09-14 15:04:50,446][63767] Sum rewards: -1.538, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.235', 'AMMO2': '0.009', 'AMMO5': '0.015', 'WEAPON1': '0.030', 'weapon4': '0.034', 'ARMOR': '0.036', 'AMMO4': '0.045', 'WEAPON4': '0.100', 'AMMO3': '0.121', 'HITCOUNT': '0.210', 'weapon5': '0.248', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.735', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.194', 'weapon3': '2.120'} +[2023-09-14 15:04:50,639][63770] DAMAGECOUNT value on done: 16023.0 +[2023-09-14 15:04:50,639][63770] Sum rewards: -0.041, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.066', 'AMMO2': '0.010', 'AMMO5': '0.012', 'weapon4': '0.028', 'AMMO4': '0.050', 'WEAPON1': '0.050', 'ARMOR': '0.088', 'WEAPON4': '0.100', 'AMMO3': '0.126', 'weapon5': '0.132', 'WEAPON5': '0.250', 'HITCOUNT': '0.370', 'WEAPON3': '0.850', 'weapon2': '1.262', 'DAMAGECOUNT': '1.317', 'weapon3': '2.130', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:51,048][63770] DAMAGECOUNT value on done: 13060.0 +[2023-09-14 15:04:51,049][63770] Sum rewards: -5.206, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.014', 'AMMO5': '0.003', 'AMMO2': '0.008', 'WEAPON1': '0.020', 'AMMO4': '0.042', 'weapon5': '0.074', 'WEAPON5': '0.100', 'weapon4': '0.142', 'HITCOUNT': '0.190', 'WEAPON4': '0.200', 'AMMO3': '0.202', 'ARMOR': '0.412', 'DAMAGECOUNT': '0.705', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.050', 'weapon2': '1.186', 'weapon3': '1.974'} +[2023-09-14 15:04:51,273][63805] DAMAGECOUNT value on done: 15507.0 +[2023-09-14 15:04:51,273][63805] Sum rewards: 0.183, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '0.005', 'AMMO5': '0.007', 'AMMO2': '0.010', 'weapon4': '0.034', 'WEAPON1': '0.040', 'WEAPON4': '0.050', 'AMMO4': '0.051', 'ARMOR': '0.068', 'AMMO3': '0.099', 'WEAPON5': '0.150', 'HITCOUNT': '0.200', 'weapon5': '0.222', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.726', 'FRAGCOUNT': '1.000', 'weapon2': '1.112', 'weapon3': '1.858'} +[2023-09-14 15:04:51,665][63805] DAMAGECOUNT value on done: 16706.0 +[2023-09-14 15:04:51,666][63805] Sum rewards: -3.628, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.760', 'AMMO4': '-0.008', 'AMMO2': '-0.002', 'AMMO5': '0.013', 'weapon4': '0.048', 'WEAPON1': '0.070', 'WEAPON4': '0.100', 'AMMO3': '0.134', 'weapon5': '0.196', 'WEAPON5': '0.250', 'HITCOUNT': '0.270', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.885', 'weapon2': '1.100', 'FRAGCOUNT': '2.000', 'weapon3': '2.226'} +[2023-09-14 15:04:51,716][63734] DAMAGECOUNT value on done: 16598.0 +[2023-09-14 15:04:51,717][63734] Sum rewards: -4.082, reward structure: {'DEATHCOUNT': '-10.500', 'AMMO2': '0.006', 'AMMO5': '0.007', 'ARMOR': '0.024', 'AMMO4': '0.028', 'HEALTH': '0.031', 'WEAPON4': '0.050', 'AMMO3': '0.126', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'weapon5': '0.294', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.825', 'weapon2': '1.020', 'weapon3': '2.386'} +[2023-09-14 15:04:51,938][63771] DAMAGECOUNT value on done: 12940.0 +[2023-09-14 15:04:51,939][63771] Sum rewards: -0.301, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.349', 'AMMO2': '0.010', 'AMMO5': '0.032', 'AMMO4': '0.050', 'WEAPON1': '0.050', 'AMMO3': '0.171', 'weapon5': '0.244', 'HITCOUNT': '0.360', 'ARMOR': '0.492', 'WEAPON5': '0.500', 'weapon2': '0.816', 'WEAPON3': '1.100', 'DAMAGECOUNT': '1.137', 'weapon3': '2.336', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:52,075][63734] DAMAGECOUNT value on done: 14420.0 +[2023-09-14 15:04:52,076][63734] Sum rewards: -0.055, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.195', 'AMMO2': '0.011', 'ARMOR': '0.016', 'AMMO5': '0.022', 'AMMO4': '0.057', 'WEAPON1': '0.080', 'WEAPON4': '0.100', 'weapon4': '0.132', 'AMMO3': '0.153', 'weapon5': '0.166', 'HITCOUNT': '0.270', 'WEAPON5': '0.450', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.990', 'weapon2': '1.452', 'weapon3': '1.690', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:04:52,336][63771] DAMAGECOUNT value on done: 15805.0 +[2023-09-14 15:04:52,336][63771] Sum rewards: -6.620, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.108', 'AMMO2': '0.007', 'AMMO5': '0.007', 'weapon5': '0.026', 'AMMO4': '0.036', 'WEAPON1': '0.060', 'ARMOR': '0.104', 'WEAPON5': '0.150', 'AMMO3': '0.166', 'weapon4': '0.188', 'HITCOUNT': '0.230', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.885', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon3': '1.616', 'weapon2': '1.812'} +[2023-09-14 15:04:52,802][63733] Updated weights for policy 1, policy_version 2420 (0.0011) +[2023-09-14 15:04:53,093][63806] DAMAGECOUNT value on done: 13635.0 +[2023-09-14 15:04:53,093][63806] Sum rewards: -3.274, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.980', 'weapon5': '0.008', 'AMMO5': '0.010', 'AMMO2': '0.011', 'WEAPON1': '0.030', 'AMMO4': '0.053', 'ARMOR': '0.125', 'AMMO3': '0.131', 'weapon4': '0.146', 'WEAPON4': '0.150', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.504', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.698', 'weapon2': '1.730'} +[2023-09-14 15:04:53,358][63770] DAMAGECOUNT value on done: 13376.0 +[2023-09-14 15:04:53,359][63770] Sum rewards: 1.305, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.475', 'AMMO2': '0.008', 'AMMO5': '0.015', 'AMMO4': '0.040', 'WEAPON1': '0.070', 'AMMO3': '0.091', 'HITCOUNT': '0.180', 'WEAPON5': '0.350', 'WEAPON3': '0.650', 'weapon5': '0.920', 'DAMAGECOUNT': '0.957', 'weapon3': '1.282', 'weapon2': '1.466', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:04:53,471][63806] DAMAGECOUNT value on done: 14238.0 +[2023-09-14 15:04:53,471][63806] Sum rewards: 5.599, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.624', 'AMMO4': '-0.008', 'AMMO2': '-0.002', 'weapon4': '0.022', 'WEAPON1': '0.040', 'WEAPON4': '0.050', 'AMMO3': '0.103', 'HITCOUNT': '0.360', 'ARMOR': '0.478', 'WEAPON3': '0.550', 'weapon2': '1.152', 'DAMAGECOUNT': '1.410', 'weapon3': '2.068', 'FRAGCOUNT': '6.000'} +[2023-09-14 15:04:53,728][63770] DAMAGECOUNT value on done: 14786.0 +[2023-09-14 15:04:53,729][63770] Sum rewards: -2.592, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.903', 'AMMO5': '0.010', 'AMMO2': '0.025', 'WEAPON1': '0.040', 'ARMOR': '0.088', 'AMMO3': '0.096', 'AMMO4': '0.126', 'weapon5': '0.138', 'weapon4': '0.196', 'WEAPON5': '0.200', 'HITCOUNT': '0.250', 'WEAPON4': '0.350', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.885', 'FRAGCOUNT': '1.000', 'weapon2': '1.614', 'weapon3': '1.642'} +[2023-09-14 15:04:54,003][63769] DAMAGECOUNT value on done: 16519.0 +[2023-09-14 15:04:54,004][63769] Sum rewards: -3.225, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.136', 'AMMO2': '0.007', 'AMMO5': '0.007', 'weapon5': '0.008', 'WEAPON1': '0.010', 'AMMO4': '0.035', 'WEAPON4': '0.050', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon4': '0.120', 'weapon7': '0.128', 'WEAPON5': '0.150', 'AMMO3': '0.173', 'HITCOUNT': '0.190', 'WEAPON7': '0.200', 'ARMOR': '0.448', 'DAMAGECOUNT': '0.741', 'weapon2': '0.762', 'WEAPON3': '1.000', 'FRAGCOUNT': '2.000', 'weapon3': '2.392'} +[2023-09-14 15:04:54,403][63769] DAMAGECOUNT value on done: 11749.0 +[2023-09-14 15:04:54,404][63769] Sum rewards: -0.264, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.751', 'AMMO2': '0.003', 'AMMO4': '0.017', 'WEAPON1': '0.020', 'AMMO5': '0.022', 'ARMOR': '0.080', 'weapon5': '0.082', 'AMMO3': '0.159', 'HITCOUNT': '0.200', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.735', 'WEAPON3': '0.850', 'weapon2': '1.616', 'weapon3': '1.852', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:04:55,823][63767] DAMAGECOUNT value on done: 15853.0 +[2023-09-14 15:04:55,823][63767] Sum rewards: -4.869, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.508', 'FRAGCOUNT': '-1.000', 'AMMO5': '0.014', 'AMMO2': '0.015', 'weapon4': '0.068', 'AMMO4': '0.073', 'ARMOR': '0.100', 'AMMO3': '0.117', 'weapon5': '0.156', 'WEAPON4': '0.200', 'HITCOUNT': '0.240', 'WEAPON5': '0.300', 'WEAPON3': '0.800', 'DAMAGECOUNT': '0.840', 'weapon2': '1.154', 'weapon3': '1.812'} +[2023-09-14 15:04:56,218][63767] DAMAGECOUNT value on done: 15825.0 +[2023-09-14 15:04:56,219][63767] Sum rewards: -0.150, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.888', 'AMMO5': '0.009', 'AMMO2': '0.016', 'WEAPON1': '0.030', 'ARMOR': '0.036', 'weapon7': '0.050', 'AMMO4': '0.078', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.145', 'WEAPON5': '0.150', 'HITCOUNT': '0.190', 'WEAPON7': '0.200', 'weapon4': '0.200', 'weapon5': '0.244', 'FRAGCOUNT': '0.500', 'DAMAGECOUNT': '0.636', 'WEAPON3': '0.650', 'weapon2': '0.684', 'weapon3': '1.830'} +[2023-09-14 15:04:56,245][63735] DAMAGECOUNT value on done: 14956.0 +[2023-09-14 15:04:56,245][63735] Sum rewards: 0.186, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.373', 'AMMO2': '0.009', 'AMMO5': '0.010', 'weapon5': '0.018', 'WEAPON1': '0.020', 'AMMO4': '0.044', 'weapon7': '0.050', 'ARMOR': '0.080', 'AMMO3': '0.093', 'WEAPON4': '0.100', 'HITCOUNT': '0.130', 'WEAPON5': '0.200', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'DAMAGECOUNT': '0.441', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.354', 'weapon3': '1.960'} +[2023-09-14 15:04:56,612][63735] DAMAGECOUNT value on done: 11517.0 +[2023-09-14 15:04:56,613][63735] Sum rewards: -2.808, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.580', 'AMMO5': '0.007', 'AMMO2': '0.015', 'ARMOR': '0.016', 'WEAPON1': '0.030', 'weapon5': '0.076', 'AMMO4': '0.077', 'WEAPON5': '0.150', 'AMMO3': '0.157', 'HITCOUNT': '0.230', 'DAMAGECOUNT': '0.741', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.254', 'weapon3': '2.218'} +[2023-09-14 15:04:57,124][63732] Updated weights for policy 0, policy_version 2230 (0.0010) +[2023-09-14 15:04:57,465][63576] Saving new best policy, reward=-1.607! +[2023-09-14 15:04:57,778][63769] DAMAGECOUNT value on done: 15001.0 +[2023-09-14 15:04:57,778][63769] Sum rewards: 0.281, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.419', 'AMMO5': '0.003', 'AMMO2': '0.009', 'WEAPON1': '0.020', 'AMMO4': '0.045', 'WEAPON5': '0.050', 'weapon7': '0.052', 'weapon4': '0.056', 'AMMO3': '0.074', 'WEAPON4': '0.100', 'weapon5': '0.116', 'HITCOUNT': '0.140', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON7': '0.200', 'WEAPON3': '0.450', 'ARMOR': '0.529', 'DAMAGECOUNT': '0.540', 'FRAGCOUNT': '1.000', 'weapon3': '1.302', 'weapon2': '1.694'} +[2023-09-14 15:04:58,222][63769] DAMAGECOUNT value on done: 12883.0 +[2023-09-14 15:04:58,223][63769] Sum rewards: -1.831, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.770', 'ARMOR': '0.008', 'AMMO2': '0.008', 'AMMO5': '0.010', 'WEAPON1': '0.030', 'AMMO4': '0.042', 'weapon7': '0.050', 'HITCOUNT': '0.060', 'AMMO3': '0.061', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.104', 'weapon5': '0.150', 'AMMO6': '0.160', 'AMMO7': '0.160', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.350', 'FRAGCOUNT': '1.000', 'weapon3': '1.042', 'weapon2': '1.724'} +[2023-09-14 15:04:58,788][63733] Updated weights for policy 1, policy_version 2430 (0.0011) +[2023-09-14 15:05:02,309][63806] DAMAGECOUNT value on done: 13289.0 +[2023-09-14 15:05:02,730][63806] DAMAGECOUNT value on done: 14442.0 +[2023-09-14 15:05:02,730][63806] Sum rewards: 2.862, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.021', 'AMMO2': '0.017', 'AMMO5': '0.018', 'WEAPON4': '0.050', 'weapon7': '0.052', 'AMMO4': '0.083', 'AMMO3': '0.117', 'weapon5': '0.118', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon4': '0.198', 'WEAPON7': '0.200', 'HITCOUNT': '0.260', 'WEAPON5': '0.350', 'ARMOR': '0.412', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.215', 'weapon2': '1.528', 'weapon3': '1.676', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:05:04,078][63805] DAMAGECOUNT value on done: 15042.0 +[2023-09-14 15:05:04,079][63805] Sum rewards: -4.498, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.314', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.030', 'ARMOR': '0.056', 'weapon5': '0.062', 'weapon4': '0.062', 'WEAPON5': '0.100', 'AMMO4': '0.151', 'AMMO3': '0.162', 'HITCOUNT': '0.180', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.630', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.416', 'weapon3': '2.104'} +[2023-09-14 15:05:04,557][63805] DAMAGECOUNT value on done: 13175.0 +[2023-09-14 15:05:05,114][63733] Updated weights for policy 1, policy_version 2440 (0.0011) +[2023-09-14 15:05:05,580][63735] DAMAGECOUNT value on done: 12377.0 +[2023-09-14 15:05:05,951][63735] DAMAGECOUNT value on done: 17212.0 +[2023-09-14 15:05:05,951][63735] Sum rewards: 0.741, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.940', 'AMMO4': '-0.027', 'AMMO2': '-0.005', 'AMMO5': '0.020', 'ARMOR': '0.032', 'WEAPON1': '0.040', 'AMMO3': '0.085', 'HITCOUNT': '0.220', 'WEAPON5': '0.300', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.960', 'weapon5': '1.030', 'weapon2': '1.214', 'weapon3': '1.362', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:05:06,331][63732] Updated weights for policy 0, policy_version 2240 (0.0012) +[2023-09-14 15:05:07,045][63734] DAMAGECOUNT value on done: 14016.0 +[2023-09-14 15:05:07,046][63734] Sum rewards: 2.346, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.129', 'AMMO5': '0.013', 'AMMO2': '0.027', 'ARMOR': '0.044', 'WEAPON4': '0.050', 'WEAPON1': '0.050', 'AMMO3': '0.092', 'weapon4': '0.108', 'AMMO4': '0.136', 'HITCOUNT': '0.250', 'WEAPON5': '0.250', 'weapon5': '0.334', 'WEAPON3': '0.500', 'DAMAGECOUNT': '1.221', 'weapon3': '1.552', 'weapon2': '1.598', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:05:07,410][63734] DAMAGECOUNT value on done: 13566.0 +[2023-09-14 15:05:07,469][63576] Saving new best policy, reward=-1.512! +[2023-09-14 15:05:10,271][63771] DAMAGECOUNT value on done: 14835.0 +[2023-09-14 15:05:10,272][63771] Sum rewards: -0.693, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.364', 'AMMO2': '0.016', 'AMMO5': '0.022', 'ARMOR': '0.028', 'WEAPON4': '0.050', 'WEAPON1': '0.060', 'weapon4': '0.074', 'AMMO4': '0.077', 'AMMO3': '0.141', 'weapon5': '0.182', 'HITCOUNT': '0.260', 'WEAPON5': '0.450', 'WEAPON3': '0.950', 'weapon2': '0.960', 'DAMAGECOUNT': '1.095', 'weapon3': '2.306', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:05:10,609][63771] DAMAGECOUNT value on done: 11650.0 +[2023-09-14 15:05:10,609][63771] Sum rewards: -0.857, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.120', 'AMMO4': '-0.012', 'AMMO2': '-0.002', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'ARMOR': '0.052', 'AMMO3': '0.124', 'weapon5': '0.212', 'WEAPON5': '0.300', 'HITCOUNT': '0.310', 'WEAPON3': '0.750', 'weapon2': '1.068', 'DAMAGECOUNT': '1.128', 'FRAGCOUNT': '1.500', 'weapon3': '2.048'} +[2023-09-14 15:05:11,588][63733] Updated weights for policy 1, policy_version 2450 (0.0010) +[2023-09-14 15:05:12,461][63576] Saving new best policy, reward=-1.458! +[2023-09-14 15:05:14,736][63805] DAMAGECOUNT value on done: 15782.0 +[2023-09-14 15:05:14,736][63805] Sum rewards: 0.978, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.168', 'AMMO2': '0.013', 'AMMO5': '0.025', 'WEAPON1': '0.040', 'weapon4': '0.056', 'AMMO4': '0.064', 'ARMOR': '0.071', 'AMMO3': '0.098', 'HITCOUNT': '0.150', 'WEAPON4': '0.200', 'WEAPON5': '0.400', 'weapon5': '0.646', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.825', 'weapon2': '0.922', 'weapon3': '1.736', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:05:15,080][63732] Updated weights for policy 0, policy_version 2250 (0.0010) +[2023-09-14 15:05:15,113][63767] DAMAGECOUNT value on done: 16242.0 +[2023-09-14 15:05:15,113][63767] Sum rewards: -2.239, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.781', 'AMMO5': '0.010', 'AMMO2': '0.014', 'AMMO4': '0.071', 'WEAPON4': '0.150', 'AMMO3': '0.160', 'weapon5': '0.184', 'WEAPON5': '0.200', 'weapon4': '0.218', 'HITCOUNT': '0.290', 'ARMOR': '0.432', 'WEAPON3': '0.850', 'DAMAGECOUNT': '0.984', 'weapon2': '1.150', 'weapon3': '1.828', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:05:15,142][63805] DAMAGECOUNT value on done: 16849.0 +[2023-09-14 15:05:15,461][63767] DAMAGECOUNT value on done: 18623.0 +[2023-09-14 15:05:15,462][63767] Sum rewards: 1.098, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-1.145', 'AMMO5': '0.009', 'AMMO2': '0.019', 'WEAPON1': '0.020', 'AMMO3': '0.054', 'AMMO4': '0.093', 'HITCOUNT': '0.130', 'weapon5': '0.188', 'WEAPON5': '0.200', 'WEAPON4': '0.250', 'WEAPON3': '0.350', 'weapon4': '0.454', 'DAMAGECOUNT': '0.513', 'ARMOR': '0.545', 'weapon3': '0.752', 'FRAGCOUNT': '1.000', 'weapon2': '2.166'} +[2023-09-14 15:05:15,823][63770] DAMAGECOUNT value on done: 16143.0 +[2023-09-14 15:05:15,823][63770] Sum rewards: -2.672, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.661', 'AMMO2': '0.003', 'AMMO5': '0.015', 'AMMO4': '0.016', 'weapon4': '0.030', 'weapon5': '0.052', 'WEAPON1': '0.060', 'HITCOUNT': '0.060', 'ARMOR': '0.090', 'AMMO3': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.360', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.518', 'weapon2': '2.034'} +[2023-09-14 15:05:16,266][63770] DAMAGECOUNT value on done: 13288.0 +[2023-09-14 15:05:16,267][63770] Sum rewards: -4.346, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.184', 'AMMO4': '-0.011', 'AMMO2': '-0.002', 'AMMO5': '0.015', 'WEAPON1': '0.030', 'weapon5': '0.062', 'ARMOR': '0.108', 'WEAPON5': '0.150', 'AMMO3': '0.164', 'HITCOUNT': '0.240', 'DAMAGECOUNT': '0.684', 'WEAPON3': '1.050', 'weapon2': '1.318', 'FRAGCOUNT': '2.000', 'weapon3': '2.280'} +[2023-09-14 15:05:16,295][63806] DAMAGECOUNT value on done: 14162.0 +[2023-09-14 15:05:16,296][63806] Sum rewards: -1.969, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.072', 'AMMO2': '0.005', 'AMMO5': '0.025', 'AMMO4': '0.026', 'weapon5': '0.088', 'ARMOR': '0.092', 'WEAPON1': '0.120', 'AMMO3': '0.147', 'WEAPON4': '0.150', 'weapon4': '0.220', 'HITCOUNT': '0.470', 'WEAPON5': '0.500', 'WEAPON3': '0.900', 'weapon2': '1.312', 'DAMAGECOUNT': '1.581', 'weapon3': '1.966', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:05:16,616][63806] DAMAGECOUNT value on done: 14263.0 +[2023-09-14 15:05:17,124][63734] DAMAGECOUNT value on done: 16670.0 +[2023-09-14 15:05:17,125][63770] DAMAGECOUNT value on done: 13891.0 +[2023-09-14 15:05:17,125][63770] Sum rewards: 2.951, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.435', 'ARMOR': '0.016', 'AMMO5': '0.030', 'AMMO2': '0.034', 'WEAPON1': '0.090', 'weapon4': '0.102', 'WEAPON4': '0.150', 'AMMO3': '0.170', 'AMMO4': '0.171', 'HITCOUNT': '0.370', 'weapon5': '0.432', 'WEAPON5': '0.500', 'WEAPON3': '0.800', 'weapon2': '1.412', 'DAMAGECOUNT': '1.545', 'weapon3': '1.564', 'FRAGCOUNT': '6.000'} +[2023-09-14 15:05:17,199][63771] DAMAGECOUNT value on done: 13020.0 +[2023-09-14 15:05:17,467][63576] Saving new best policy, reward=-1.248! +[2023-09-14 15:05:17,498][63770] DAMAGECOUNT value on done: 15016.0 +[2023-09-14 15:05:17,498][63770] Sum rewards: -4.159, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-2.260', 'AMMO2': '0.010', 'AMMO5': '0.023', 'AMMO4': '0.049', 'WEAPON4': '0.050', 'weapon4': '0.050', 'ARMOR': '0.068', 'WEAPON1': '0.070', 'AMMO3': '0.121', 'HITCOUNT': '0.210', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.690', 'WEAPON3': '0.800', 'weapon5': '0.838', 'FRAGCOUNT': '1.000', 'weapon2': '1.326', 'weapon3': '1.446'} +[2023-09-14 15:05:17,516][63734] DAMAGECOUNT value on done: 14585.0 +[2023-09-14 15:05:17,516][63734] Sum rewards: -3.687, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.760', 'AMMO4': '-0.010', 'AMMO2': '-0.002', 'AMMO5': '0.025', 'WEAPON4': '0.100', 'WEAPON1': '0.100', 'weapon4': '0.100', 'HITCOUNT': '0.150', 'AMMO3': '0.178', 'weapon5': '0.204', 'DAMAGECOUNT': '0.495', 'WEAPON5': '0.500', 'WEAPON3': '0.650', 'weapon2': '1.510', 'weapon3': '1.822', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:05:17,621][63771] DAMAGECOUNT value on done: 16088.0 +[2023-09-14 15:05:17,621][63771] Sum rewards: 0.364, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.920', 'AMMO4': '-0.027', 'AMMO2': '-0.005', 'AMMO5': '0.018', 'WEAPON1': '0.060', 'ARMOR': '0.080', 'AMMO3': '0.087', 'weapon5': '0.248', 'HITCOUNT': '0.250', 'WEAPON5': '0.400', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.849', 'weapon3': '1.522', 'FRAGCOUNT': '2.000', 'weapon2': '2.002'} +[2023-09-14 15:05:18,236][63733] Updated weights for policy 1, policy_version 2460 (0.0011) +[2023-09-14 15:05:18,753][63767] DAMAGECOUNT value on done: 16662.0 +[2023-09-14 15:05:18,754][63767] Sum rewards: 4.178, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.095', 'AMMO2': '0.007', 'AMMO5': '0.011', 'ARMOR': '0.020', 'WEAPON1': '0.020', 'AMMO4': '0.036', 'WEAPON4': '0.050', 'AMMO3': '0.104', 'weapon4': '0.132', 'WEAPON5': '0.250', 'weapon5': '0.282', 'WEAPON3': '0.650', 'HITCOUNT': '0.680', 'weapon2': '1.100', 'weapon3': '2.004', 'DAMAGECOUNT': '2.427', 'FRAGCOUNT': '5.000'} +[2023-09-14 15:05:19,089][63767] DAMAGECOUNT value on done: 15900.0 +[2023-09-14 15:05:19,090][63767] Sum rewards: -4.253, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.515', 'AMMO5': '0.005', 'AMMO2': '0.017', 'weapon5': '0.034', 'ARMOR': '0.040', 'HITCOUNT': '0.080', 'AMMO4': '0.085', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.127', 'DAMAGECOUNT': '0.225', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.230', 'weapon3': '2.268'} +[2023-09-14 15:05:19,351][63769] DAMAGECOUNT value on done: 17161.0 +[2023-09-14 15:05:19,352][63769] Sum rewards: 3.234, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.388', 'AMMO2': '0.005', 'AMMO5': '0.018', 'AMMO4': '0.024', 'WEAPON1': '0.040', 'ARMOR': '0.040', 'weapon7': '0.082', 'WEAPON4': '0.100', 'AMMO3': '0.127', 'weapon4': '0.184', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.280', 'WEAPON5': '0.350', 'weapon5': '0.424', 'WEAPON3': '0.800', 'weapon2': '1.102', 'weapon3': '1.770', 'DAMAGECOUNT': '1.926', 'FRAGCOUNT': '5.000'} +[2023-09-14 15:05:19,807][63769] DAMAGECOUNT value on done: 12084.0 +[2023-09-14 15:05:19,807][63769] Sum rewards: 2.102, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.590', 'AMMO2': '0.005', 'AMMO4': '0.026', 'ARMOR': '0.028', 'AMMO5': '0.030', 'AMMO3': '0.082', 'WEAPON1': '0.090', 'WEAPON4': '0.100', 'weapon7': '0.118', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon4': '0.134', 'WEAPON7': '0.200', 'HITCOUNT': '0.270', 'WEAPON3': '0.550', 'weapon5': '0.576', 'WEAPON5': '0.600', 'DAMAGECOUNT': '1.005', 'weapon2': '1.094', 'weapon3': '1.544', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:05:21,135][63735] DAMAGECOUNT value on done: 15093.0 +[2023-09-14 15:05:21,135][63735] Sum rewards: 0.853, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.648', 'AMMO2': '0.009', 'AMMO5': '0.015', 'ARMOR': '0.036', 'AMMO4': '0.046', 'WEAPON1': '0.050', 'weapon5': '0.078', 'AMMO3': '0.085', 'weapon4': '0.104', 'HITCOUNT': '0.140', 'WEAPON4': '0.150', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.411', 'WEAPON3': '0.600', 'weapon3': '1.502', 'weapon2': '1.974', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:05:21,541][63735] DAMAGECOUNT value on done: 11838.0 +[2023-09-14 15:05:21,542][63735] Sum rewards: -4.243, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.232', 'AMMO2': '0.008', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'AMMO4': '0.039', 'ARMOR': '0.080', 'weapon5': '0.172', 'AMMO3': '0.197', 'WEAPON5': '0.200', 'HITCOUNT': '0.260', 'DAMAGECOUNT': '0.963', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.116', 'weapon3': '2.424'} +[2023-09-14 15:05:22,462][63576] Saving new best policy, reward=-1.104! +[2023-09-14 15:05:23,284][63769] DAMAGECOUNT value on done: 15181.0 +[2023-09-14 15:05:23,284][63769] Sum rewards: -0.045, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.660', 'AMMO5': '0.003', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'AMMO4': '0.019', 'WEAPON5': '0.050', 'AMMO3': '0.077', 'weapon5': '0.130', 'HITCOUNT': '0.180', 'ARMOR': '0.521', 'DAMAGECOUNT': '0.540', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'weapon2': '1.288', 'weapon3': '1.494'} +[2023-09-14 15:05:23,667][63769] DAMAGECOUNT value on done: 13018.0 +[2023-09-14 15:05:23,868][63732] Updated weights for policy 0, policy_version 2260 (0.0011) +[2023-09-14 15:05:25,123][63733] Updated weights for policy 1, policy_version 2470 (0.0017) +[2023-09-14 15:05:27,078][63806] DAMAGECOUNT value on done: 13454.0 +[2023-09-14 15:05:27,079][63806] Sum rewards: -1.193, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.708', 'AMMO5': '0.007', 'AMMO2': '0.011', 'WEAPON1': '0.030', 'AMMO4': '0.055', 'AMMO3': '0.100', 'WEAPON4': '0.100', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'weapon4': '0.168', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.550', 'weapon5': '0.934', 'FRAGCOUNT': '1.000', 'weapon2': '1.218', 'weapon3': '1.306'} +[2023-09-14 15:05:27,473][63806] DAMAGECOUNT value on done: 14891.0 +[2023-09-14 15:05:27,473][63806] Sum rewards: 2.912, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.214', 'AMMO5': '0.010', 'AMMO2': '0.019', 'weapon5': '0.028', 'WEAPON1': '0.030', 'WEAPON4': '0.050', 'AMMO4': '0.092', 'AMMO3': '0.184', 'WEAPON5': '0.200', 'HITCOUNT': '0.360', 'ARMOR': '0.400', 'WEAPON3': '0.800', 'weapon2': '1.294', 'DAMAGECOUNT': '1.347', 'weapon3': '2.312', 'FRAGCOUNT': '5.000'} +[2023-09-14 15:05:29,378][63805] DAMAGECOUNT value on done: 15336.0 +[2023-09-14 15:05:29,378][63805] Sum rewards: -0.173, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO2': '0.005', 'AMMO5': '0.015', 'AMMO4': '0.025', 'HEALTH': '0.027', 'ARMOR': '0.042', 'AMMO3': '0.094', 'weapon5': '0.244', 'WEAPON5': '0.250', 'HITCOUNT': '0.250', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.882', 'FRAGCOUNT': '1.000', 'weapon2': '1.476', 'weapon3': '1.716'} +[2023-09-14 15:05:29,782][63805] DAMAGECOUNT value on done: 13550.0 +[2023-09-14 15:05:29,783][63805] Sum rewards: -0.240, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.784', 'ARMOR': '0.004', 'AMMO2': '0.018', 'AMMO5': '0.025', 'AMMO3': '0.076', 'weapon4': '0.086', 'AMMO4': '0.090', 'WEAPON1': '0.120', 'WEAPON4': '0.150', 'HITCOUNT': '0.290', 'weapon5': '0.368', 'WEAPON3': '0.500', 'WEAPON5': '0.500', 'DAMAGECOUNT': '1.125', 'weapon2': '1.294', 'weapon3': '1.398', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:05:30,495][63735] DAMAGECOUNT value on done: 12820.0 +[2023-09-14 15:05:30,496][63735] Sum rewards: -4.927, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.572', 'AMMO4': '-0.054', 'AMMO2': '-0.011', 'AMMO5': '0.024', 'ARMOR': '0.052', 'AMMO3': '0.172', 'HITCOUNT': '0.230', 'weapon5': '0.256', 'WEAPON5': '0.400', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.329', 'weapon2': '1.348', 'weapon3': '1.998', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:05:30,886][63735] DAMAGECOUNT value on done: 17583.0 +[2023-09-14 15:05:30,886][63735] Sum rewards: 2.792, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.620', 'AMMO2': '0.000', 'AMMO4': '0.002', 'weapon4': '0.008', 'AMMO5': '0.017', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'WEAPON1': '0.090', 'AMMO3': '0.111', 'weapon5': '0.218', 'WEAPON5': '0.350', 'HITCOUNT': '0.370', 'WEAPON3': '0.650', 'DAMAGECOUNT': '1.113', 'weapon2': '1.328', 'weapon3': '2.064', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:05:31,776][63732] Updated weights for policy 0, policy_version 2270 (0.0011) +[2023-09-14 15:05:32,060][63733] Updated weights for policy 1, policy_version 2480 (0.0012) +[2023-09-14 15:05:32,461][63576] Saving new best policy, reward=-1.086! +[2023-09-14 15:05:32,901][63734] DAMAGECOUNT value on done: 14320.0 +[2023-09-14 15:05:32,901][63734] Sum rewards: -3.521, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.740', 'AMMO5': '0.012', 'AMMO2': '0.016', 'WEAPON1': '0.050', 'AMMO4': '0.078', 'AMMO3': '0.157', 'weapon5': '0.188', 'HITCOUNT': '0.250', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.912', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.308', 'weapon3': '1.998'} +[2023-09-14 15:05:33,244][63734] DAMAGECOUNT value on done: 14002.0 +[2023-09-14 15:05:33,244][63734] Sum rewards: -0.327, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.732', 'WEAPON1': '0.010', 'AMMO5': '0.012', 'AMMO2': '0.013', 'ARMOR': '0.040', 'AMMO4': '0.065', 'AMMO3': '0.117', 'weapon5': '0.184', 'WEAPON5': '0.200', 'HITCOUNT': '0.450', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.308', 'weapon2': '1.692', 'weapon3': '1.814', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:05:35,837][63771] DAMAGECOUNT value on done: 15083.0 +[2023-09-14 15:05:35,837][63771] Sum rewards: -2.859, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.052', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.016', 'AMMO5': '0.018', 'WEAPON1': '0.060', 'AMMO4': '0.080', 'AMMO3': '0.093', 'WEAPON4': '0.100', 'weapon4': '0.190', 'HITCOUNT': '0.280', 'WEAPON5': '0.350', 'WEAPON3': '0.450', 'weapon5': '0.480', 'DAMAGECOUNT': '0.744', 'weapon3': '1.150', 'weapon2': '1.432'} +[2023-09-14 15:05:36,193][63771] DAMAGECOUNT value on done: 11800.0 +[2023-09-14 15:05:36,194][63771] Sum rewards: -5.705, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-0.946', 'AMMO5': '0.015', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'AMMO4': '0.088', 'HITCOUNT': '0.090', 'AMMO3': '0.142', 'WEAPON4': '0.150', 'weapon4': '0.174', 'WEAPON5': '0.250', 'weapon5': '0.262', 'DAMAGECOUNT': '0.450', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon2': '1.238', 'weapon3': '1.758'} +[2023-09-14 15:05:37,466][63576] Saving new best policy, reward=-1.065! +[2023-09-14 15:05:38,277][63805] DAMAGECOUNT value on done: 15892.0 +[2023-09-14 15:05:38,678][63805] DAMAGECOUNT value on done: 17085.0 +[2023-09-14 15:05:38,679][63805] Sum rewards: -1.442, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.775', 'AMMO5': '0.010', 'AMMO2': '0.018', 'WEAPON1': '0.060', 'AMMO4': '0.091', 'AMMO3': '0.107', 'WEAPON4': '0.150', 'HITCOUNT': '0.170', 'WEAPON5': '0.200', 'weapon5': '0.224', 'weapon4': '0.248', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.708', 'weapon3': '1.522', 'weapon2': '1.524', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:05:39,083][63733] Updated weights for policy 1, policy_version 2490 (0.0010) +[2023-09-14 15:05:39,251][63806] DAMAGECOUNT value on done: 14512.0 +[2023-09-14 15:05:39,252][63806] Sum rewards: 1.440, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.053', 'AMMO2': '0.011', 'AMMO5': '0.028', 'weapon4': '0.038', 'ARMOR': '0.040', 'WEAPON4': '0.050', 'AMMO4': '0.056', 'WEAPON1': '0.080', 'AMMO3': '0.140', 'weapon5': '0.204', 'HITCOUNT': '0.250', 'WEAPON5': '0.350', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.050', 'weapon2': '1.470', 'weapon3': '1.826', 'FRAGCOUNT': '5.000'} +[2023-09-14 15:05:39,593][63806] DAMAGECOUNT value on done: 14503.0 +[2023-09-14 15:05:39,594][63806] Sum rewards: -5.050, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.866', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'AMMO2': '0.030', 'weapon5': '0.052', 'ARMOR': '0.068', 'weapon4': '0.086', 'WEAPON5': '0.150', 'AMMO4': '0.151', 'AMMO3': '0.157', 'HITCOUNT': '0.210', 'WEAPON4': '0.400', 'DAMAGECOUNT': '0.720', 'WEAPON3': '0.800', 'FRAGCOUNT': '1.000', 'weapon3': '1.660', 'weapon2': '1.802'} +[2023-09-14 15:05:39,818][63732] Updated weights for policy 0, policy_version 2280 (0.0011) +[2023-09-14 15:05:40,166][63767] DAMAGECOUNT value on done: 16749.0 +[2023-09-14 15:05:40,166][63767] Sum rewards: -1.222, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.328', 'AMMO2': '0.010', 'AMMO5': '0.020', 'ARMOR': '0.032', 'AMMO4': '0.047', 'WEAPON4': '0.050', 'weapon4': '0.112', 'weapon5': '0.156', 'AMMO3': '0.212', 'HITCOUNT': '0.310', 'WEAPON5': '0.400', 'weapon2': '1.130', 'WEAPON3': '1.300', 'DAMAGECOUNT': '1.521', 'weapon3': '2.306', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:05:40,601][63767] DAMAGECOUNT value on done: 18798.0 +[2023-09-14 15:05:40,602][63767] Sum rewards: -5.913, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.724', 'AMMO2': '0.006', 'ARMOR': '0.016', 'AMMO5': '0.020', 'AMMO4': '0.028', 'WEAPON4': '0.050', 'weapon4': '0.076', 'WEAPON1': '0.090', 'AMMO3': '0.104', 'weapon5': '0.160', 'HITCOUNT': '0.180', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.525', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.362', 'weapon2': '1.794'} +[2023-09-14 15:05:40,746][63770] DAMAGECOUNT value on done: 13941.0 +[2023-09-14 15:05:40,746][63770] Sum rewards: -1.047, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.707', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.015', 'weapon5': '0.034', 'WEAPON5': '0.050', 'ARMOR': '0.060', 'HITCOUNT': '0.060', 'AMMO4': '0.074', 'AMMO3': '0.100', 'DAMAGECOUNT': '0.150', 'WEAPON4': '0.250', 'weapon4': '0.270', 'WEAPON3': '0.500', 'FRAGCOUNT': '1.000', 'weapon2': '1.416', 'weapon3': '1.668'} +[2023-09-14 15:05:41,120][63770] DAMAGECOUNT value on done: 15230.0 +[2023-09-14 15:05:41,121][63770] Sum rewards: -6.784, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.162', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.018', 'AMMO2': '0.024', 'ARMOR': '0.044', 'WEAPON4': '0.050', 'WEAPON1': '0.070', 'AMMO4': '0.118', 'HITCOUNT': '0.160', 'weapon4': '0.162', 'AMMO3': '0.164', 'weapon5': '0.174', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.642', 'WEAPON3': '1.000', 'weapon2': '1.050', 'weapon3': '2.102'} +[2023-09-14 15:05:41,227][63770] DAMAGECOUNT value on done: 16233.0 +[2023-09-14 15:05:41,228][63770] Sum rewards: -1.450, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.424', 'AMMO2': '0.000', 'AMMO4': '0.001', 'AMMO5': '0.010', 'AMMO3': '0.063', 'WEAPON1': '0.070', 'HITCOUNT': '0.100', 'WEAPON5': '0.200', 'weapon5': '0.256', 'DAMAGECOUNT': '0.270', 'ARMOR': '0.400', 'WEAPON3': '0.450', 'FRAGCOUNT': '1.000', 'weapon3': '1.404', 'weapon2': '1.500'} +[2023-09-14 15:05:41,530][63767] DAMAGECOUNT value on done: 16962.0 +[2023-09-14 15:05:41,530][63767] Sum rewards: -1.327, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.492', 'AMMO5': '0.010', 'ARMOR': '0.012', 'AMMO2': '0.022', 'weapon4': '0.090', 'WEAPON4': '0.100', 'AMMO4': '0.111', 'AMMO3': '0.146', 'WEAPON5': '0.150', 'weapon5': '0.198', 'HITCOUNT': '0.220', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.900', 'weapon2': '1.668', 'weapon3': '1.788', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:05:41,627][63770] DAMAGECOUNT value on done: 13869.0 +[2023-09-14 15:05:41,628][63770] Sum rewards: 0.980, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.840', 'AMMO4': '-0.044', 'AMMO2': '-0.009', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'WEAPON4': '0.050', 'weapon4': '0.060', 'AMMO3': '0.122', 'weapon5': '0.220', 'WEAPON5': '0.300', 'HITCOUNT': '0.400', 'WEAPON3': '0.800', 'weapon2': '1.474', 'weapon3': '1.666', 'DAMAGECOUNT': '1.743', 'FRAGCOUNT': '5.000'} +[2023-09-14 15:05:41,877][63767] DAMAGECOUNT value on done: 16232.0 +[2023-09-14 15:05:41,878][63767] Sum rewards: -4.634, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.188', 'AMMO5': '0.010', 'AMMO2': '0.014', 'weapon4': '0.048', 'AMMO4': '0.068', 'ARMOR': '0.086', 'WEAPON4': '0.150', 'AMMO3': '0.162', 'weapon5': '0.166', 'WEAPON5': '0.200', 'HITCOUNT': '0.250', 'WEAPON3': '0.950', 'DAMAGECOUNT': '0.996', 'FRAGCOUNT': '1.000', 'weapon2': '1.426', 'weapon3': '2.028'} +[2023-09-14 15:05:42,776][63771] DAMAGECOUNT value on done: 13189.0 +[2023-09-14 15:05:42,776][63771] Sum rewards: -0.064, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.564', 'AMMO5': '0.007', 'AMMO2': '0.013', 'weapon4': '0.020', 'WEAPON4': '0.050', 'AMMO4': '0.067', 'ARMOR': '0.076', 'AMMO3': '0.135', 'weapon5': '0.138', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.507', 'WEAPON3': '0.800', 'weapon2': '1.162', 'weapon3': '1.734', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:05:42,930][63734] DAMAGECOUNT value on done: 16886.0 +[2023-09-14 15:05:42,930][63734] Sum rewards: -3.994, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.110', 'AMMO2': '0.002', 'AMMO4': '0.010', 'AMMO5': '0.010', 'ARMOR': '0.024', 'weapon5': '0.074', 'AMMO3': '0.142', 'WEAPON5': '0.200', 'HITCOUNT': '0.250', 'DAMAGECOUNT': '0.648', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.470', 'weapon3': '2.186'} +[2023-09-14 15:05:43,177][63771] DAMAGECOUNT value on done: 16286.0 +[2023-09-14 15:05:43,288][63734] DAMAGECOUNT value on done: 15139.0 +[2023-09-14 15:05:43,288][63734] Sum rewards: 5.811, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.520', 'AMMO4': '-0.068', 'AMMO2': '-0.013', 'AMMO5': '0.010', 'weapon5': '0.032', 'ARMOR': '0.050', 'weapon4': '0.064', 'AMMO3': '0.080', 'WEAPON1': '0.100', 'WEAPON4': '0.100', 'WEAPON5': '0.200', 'HITCOUNT': '0.430', 'WEAPON3': '0.550', 'weapon3': '1.478', 'DAMAGECOUNT': '1.662', 'weapon2': '1.906', 'FRAGCOUNT': '6.000'} +[2023-09-14 15:05:44,646][63769] DAMAGECOUNT value on done: 17760.0 +[2023-09-14 15:05:44,646][63769] Sum rewards: 5.394, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.267', 'AMMO2': '0.009', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'weapon5': '0.030', 'AMMO4': '0.043', 'AMMO3': '0.092', 'weapon4': '0.168', 'WEAPON5': '0.200', 'WEAPON4': '0.200', 'HITCOUNT': '0.420', 'ARMOR': '0.452', 'WEAPON3': '0.700', 'weapon2': '1.552', 'weapon3': '1.710', 'DAMAGECOUNT': '1.797', 'FRAGCOUNT': '6.000'} +[2023-09-14 15:05:45,053][63769] DAMAGECOUNT value on done: 12175.0 +[2023-09-14 15:05:45,053][63769] Sum rewards: 0.520, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.583', 'AMMO2': '0.005', 'AMMO5': '0.007', 'AMMO4': '0.023', 'ARMOR': '0.024', 'WEAPON1': '0.050', 'AMMO3': '0.079', 'HITCOUNT': '0.110', 'WEAPON5': '0.150', 'DAMAGECOUNT': '0.273', 'WEAPON3': '0.450', 'weapon5': '0.694', 'FRAGCOUNT': '1.000', 'weapon3': '1.320', 'weapon2': '1.418'} +[2023-09-14 15:05:46,140][63735] DAMAGECOUNT value on done: 15303.0 +[2023-09-14 15:05:46,371][63769] DAMAGECOUNT value on done: 15385.0 +[2023-09-14 15:05:46,372][63769] Sum rewards: -0.503, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.010', 'AMMO4': '-0.039', 'AMMO2': '-0.008', 'AMMO5': '0.017', 'WEAPON1': '0.040', 'ARMOR': '0.054', 'WEAPON4': '0.100', 'AMMO3': '0.127', 'weapon4': '0.208', 'HITCOUNT': '0.210', 'WEAPON5': '0.400', 'weapon5': '0.492', 'DAMAGECOUNT': '0.612', 'WEAPON3': '0.900', 'weapon2': '1.104', 'weapon3': '1.790', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:05:46,459][63733] Updated weights for policy 1, policy_version 2500 (0.0010) +[2023-09-14 15:05:46,515][63735] DAMAGECOUNT value on done: 12438.0 +[2023-09-14 15:05:46,516][63735] Sum rewards: 1.430, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-1.242', 'AMMO5': '0.007', 'AMMO2': '0.012', 'WEAPON1': '0.020', 'ARMOR': '0.028', 'AMMO4': '0.061', 'weapon5': '0.080', 'WEAPON5': '0.100', 'AMMO3': '0.183', 'HITCOUNT': '0.380', 'WEAPON3': '0.950', 'weapon2': '1.236', 'DAMAGECOUNT': '1.800', 'weapon3': '2.314', 'FRAGCOUNT': '6.000'} +[2023-09-14 15:05:46,763][63769] DAMAGECOUNT value on done: 13234.0 +[2023-09-14 15:05:46,763][63769] Sum rewards: -4.530, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.705', 'AMMO2': '0.002', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO4': '0.010', 'weapon5': '0.020', 'ARMOR': '0.056', 'weapon7': '0.080', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.130', 'HITCOUNT': '0.180', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'DAMAGECOUNT': '0.648', 'WEAPON3': '0.850', 'FRAGCOUNT': '1.000', 'weapon2': '1.620', 'weapon3': '1.668'} +[2023-09-14 15:05:47,410][63732] Updated weights for policy 0, policy_version 2290 (0.0011) +[2023-09-14 15:05:51,910][63806] DAMAGECOUNT value on done: 13577.0 +[2023-09-14 15:05:51,911][63806] Sum rewards: -1.066, reward structure: {'DEATHCOUNT': '-3.750', 'HEALTH': '-1.125', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.008', 'AMMO5': '0.009', 'weapon5': '0.032', 'AMMO4': '0.040', 'weapon4': '0.044', 'AMMO3': '0.060', 'WEAPON1': '0.060', 'WEAPON4': '0.100', 'HITCOUNT': '0.130', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.369', 'WEAPON3': '0.450', 'weapon3': '1.346', 'weapon2': '1.460'} +[2023-09-14 15:05:52,285][63806] DAMAGECOUNT value on done: 15133.0 +[2023-09-14 15:05:52,286][63806] Sum rewards: -2.278, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.524', 'AMMO4': '-0.055', 'AMMO2': '-0.011', 'weapon5': '0.014', 'AMMO5': '0.015', 'WEAPON1': '0.080', 'AMMO3': '0.143', 'HITCOUNT': '0.190', 'WEAPON5': '0.300', 'ARMOR': '0.508', 'DAMAGECOUNT': '0.726', 'WEAPON3': '0.800', 'weapon2': '1.092', 'weapon3': '1.944', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:05:54,027][63733] Updated weights for policy 1, policy_version 2510 (0.0011) +[2023-09-14 15:05:54,507][63805] DAMAGECOUNT value on done: 15671.0 +[2023-09-14 15:05:54,508][63805] Sum rewards: 2.929, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.086', 'AMMO5': '0.010', 'AMMO2': '0.020', 'WEAPON1': '0.030', 'AMMO4': '0.101', 'AMMO3': '0.110', 'HITCOUNT': '0.130', 'weapon5': '0.136', 'WEAPON5': '0.200', 'ARMOR': '0.416', 'WEAPON3': '0.550', 'DAMAGECOUNT': '1.005', 'weapon2': '1.220', 'weapon3': '2.086', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:05:54,903][63805] DAMAGECOUNT value on done: 14057.0 +[2023-09-14 15:05:54,904][63805] Sum rewards: 0.108, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.783', 'AMMO2': '0.010', 'AMMO5': '0.017', 'ARMOR': '0.040', 'weapon4': '0.040', 'weapon7': '0.046', 'WEAPON4': '0.050', 'AMMO4': '0.052', 'WEAPON1': '0.070', 'weapon5': '0.100', 'AMMO3': '0.128', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'HITCOUNT': '0.330', 'WEAPON5': '0.350', 'WEAPON3': '0.900', 'weapon2': '1.252', 'DAMAGECOUNT': '1.521', 'weapon3': '2.134', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:05:54,984][63732] Updated weights for policy 0, policy_version 2300 (0.0011) +[2023-09-14 15:05:55,640][63735] DAMAGECOUNT value on done: 13255.0 +[2023-09-14 15:05:55,640][63735] Sum rewards: 2.317, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.463', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'ARMOR': '0.032', 'AMMO3': '0.101', 'WEAPON5': '0.150', 'HITCOUNT': '0.240', 'weapon5': '0.348', 'WEAPON3': '0.600', 'DAMAGECOUNT': '1.305', 'weapon2': '1.462', 'weapon3': '1.780', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:05:56,046][63735] DAMAGECOUNT value on done: 17804.0 +[2023-09-14 15:05:56,046][63735] Sum rewards: -1.224, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO5': '0.007', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'ARMOR': '0.050', 'AMMO4': '0.092', 'WEAPON4': '0.100', 'weapon4': '0.102', 'AMMO3': '0.103', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'weapon5': '0.184', 'WEAPON3': '0.550', 'HEALTH': '0.592', 'DAMAGECOUNT': '0.663', 'FRAGCOUNT': '1.000', 'weapon2': '1.446', 'weapon3': '1.808'} +[2023-09-14 15:05:58,530][63734] DAMAGECOUNT value on done: 14430.0 +[2023-09-14 15:05:58,531][63734] Sum rewards: -3.992, reward structure: {'DEATHCOUNT': '-7.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.152', 'AMMO2': '0.011', 'AMMO5': '0.025', 'weapon4': '0.030', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'WEAPON1': '0.050', 'AMMO4': '0.055', 'AMMO3': '0.075', 'HITCOUNT': '0.100', 'weapon5': '0.224', 'DAMAGECOUNT': '0.330', 'WEAPON3': '0.400', 'WEAPON5': '0.450', 'weapon3': '1.510', 'weapon2': '1.818'} +[2023-09-14 15:05:58,911][63734] DAMAGECOUNT value on done: 14343.0 +[2023-09-14 15:05:58,911][63734] Sum rewards: -0.699, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.102', 'AMMO2': '0.005', 'AMMO5': '0.005', 'AMMO4': '0.022', 'ARMOR': '0.036', 'WEAPON1': '0.040', 'AMMO3': '0.152', 'HITCOUNT': '0.160', 'WEAPON5': '0.200', 'weapon5': '0.272', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.023', 'weapon2': '1.046', 'weapon3': '2.092', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:06:01,102][63805] DAMAGECOUNT value on done: 15962.0 +[2023-09-14 15:06:01,255][63771] DAMAGECOUNT value on done: 15308.0 +[2023-09-14 15:06:01,256][63771] Sum rewards: -1.546, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.490', 'AMMO2': '0.004', 'weapon7': '0.016', 'AMMO5': '0.020', 'AMMO4': '0.021', 'weapon5': '0.068', 'ARMOR': '0.070', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'WEAPON1': '0.100', 'AMMO3': '0.112', 'weapon4': '0.114', 'WEAPON4': '0.150', 'HITCOUNT': '0.210', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.675', 'WEAPON3': '0.700', 'weapon2': '1.132', 'FRAGCOUNT': '2.000', 'weapon3': '2.102'} +[2023-09-14 15:06:01,477][63805] DAMAGECOUNT value on done: 17405.0 +[2023-09-14 15:06:01,478][63805] Sum rewards: 1.900, reward structure: {'DEATHCOUNT': '-7.500', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'AMMO2': '0.032', 'ARMOR': '0.048', 'WEAPON5': '0.050', 'AMMO3': '0.116', 'AMMO4': '0.161', 'weapon4': '0.218', 'HITCOUNT': '0.250', 'WEAPON4': '0.300', 'HEALTH': '0.470', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.960', 'weapon3': '1.480', 'weapon2': '1.802', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:06:01,493][63733] Updated weights for policy 1, policy_version 2520 (0.0010) +[2023-09-14 15:06:01,715][63771] DAMAGECOUNT value on done: 12075.0 +[2023-09-14 15:06:01,715][63771] Sum rewards: -5.203, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.074', 'AMMO4': '-0.024', 'AMMO2': '-0.005', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'weapon5': '0.014', 'ARMOR': '0.060', 'AMMO3': '0.195', 'WEAPON5': '0.200', 'HITCOUNT': '0.290', 'DAMAGECOUNT': '0.825', 'FRAGCOUNT': '1.000', 'WEAPON3': '1.100', 'weapon2': '1.342', 'weapon3': '2.354'} +[2023-09-14 15:06:01,772][63806] DAMAGECOUNT value on done: 14558.0 +[2023-09-14 15:06:01,772][63806] Sum rewards: -5.624, reward structure: {'DEATHCOUNT': '-8.250', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.394', 'AMMO5': '0.007', 'AMMO2': '0.009', 'WEAPON1': '0.020', 'ARMOR': '0.028', 'AMMO4': '0.043', 'HITCOUNT': '0.080', 'AMMO3': '0.129', 'DAMAGECOUNT': '0.138', 'WEAPON5': '0.150', 'weapon5': '0.322', 'WEAPON3': '0.550', 'weapon3': '1.258', 'weapon2': '1.786'} +[2023-09-14 15:06:02,095][63806] DAMAGECOUNT value on done: 14863.0 +[2023-09-14 15:06:02,096][63806] Sum rewards: -2.390, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.900', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'AMMO5': '0.020', 'WEAPON1': '0.100', 'AMMO3': '0.150', 'weapon5': '0.258', 'HITCOUNT': '0.320', 'WEAPON5': '0.400', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.080', 'weapon2': '1.254', 'FRAGCOUNT': '2.000', 'weapon3': '2.086'} +[2023-09-14 15:06:02,470][63732] Updated weights for policy 0, policy_version 2310 (0.0011) +[2023-09-14 15:06:04,319][63767] DAMAGECOUNT value on done: 17262.0 +[2023-09-14 15:06:04,320][63767] Sum rewards: -2.326, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.060', 'AMMO2': '0.001', 'AMMO4': '0.003', 'AMMO5': '0.019', 'WEAPON1': '0.030', 'weapon5': '0.052', 'WEAPON4': '0.100', 'AMMO3': '0.135', 'weapon7': '0.154', 'weapon4': '0.174', 'HITCOUNT': '0.250', 'AMMO6': '0.300', 'WEAPON7': '0.300', 'AMMO7': '0.300', 'WEAPON5': '0.400', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.900', 'FRAGCOUNT': '1.000', 'weapon2': '1.026', 'weapon3': '1.940'} +[2023-09-14 15:06:04,685][63767] DAMAGECOUNT value on done: 16562.0 +[2023-09-14 15:06:04,685][63767] Sum rewards: -2.429, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.380', 'AMMO4': '-0.029', 'AMMO2': '-0.006', 'AMMO5': '0.003', 'WEAPON1': '0.030', 'weapon5': '0.056', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.167', 'weapon4': '0.198', 'HITCOUNT': '0.280', 'ARMOR': '0.516', 'WEAPON3': '0.950', 'DAMAGECOUNT': '0.990', 'weapon2': '1.254', 'weapon3': '2.092', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:06:05,265][63767] DAMAGECOUNT value on done: 17262.0 +[2023-09-14 15:06:05,265][63767] Sum rewards: -0.736, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.030', 'AMMO2': '0.005', 'AMMO5': '0.014', 'AMMO4': '0.023', 'weapon5': '0.090', 'WEAPON4': '0.100', 'weapon4': '0.102', 'AMMO3': '0.155', 'WEAPON5': '0.300', 'HITCOUNT': '0.390', 'ARMOR': '0.488', 'WEAPON3': '0.950', 'weapon2': '0.956', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.539', 'weapon3': '2.432'} +[2023-09-14 15:06:05,663][63767] DAMAGECOUNT value on done: 18861.0 +[2023-09-14 15:06:06,359][63770] DAMAGECOUNT value on done: 14100.0 +[2023-09-14 15:06:06,359][63770] Sum rewards: -1.328, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.332', 'AMMO2': '0.008', 'AMMO5': '0.013', 'AMMO4': '0.041', 'ARMOR': '0.112', 'AMMO3': '0.122', 'HITCOUNT': '0.130', 'WEAPON4': '0.150', 'WEAPON5': '0.250', 'weapon5': '0.368', 'weapon4': '0.390', 'DAMAGECOUNT': '0.477', 'WEAPON3': '0.650', 'weapon2': '0.900', 'FRAGCOUNT': '1.000', 'weapon3': '1.392'} +[2023-09-14 15:06:06,743][63770] DAMAGECOUNT value on done: 15344.0 +[2023-09-14 15:06:06,743][63770] Sum rewards: -3.997, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.086', 'AMMO5': '0.020', 'weapon4': '0.028', 'AMMO2': '0.033', 'WEAPON1': '0.070', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'AMMO3': '0.155', 'AMMO4': '0.166', 'weapon5': '0.260', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.342', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.000', 'weapon2': '1.154', 'weapon3': '2.100'} +[2023-09-14 15:06:06,823][63770] DAMAGECOUNT value on done: 16404.0 +[2023-09-14 15:06:06,823][63770] Sum rewards: -0.230, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-1.293', 'AMMO2': '0.011', 'AMMO5': '0.013', 'ARMOR': '0.024', 'WEAPON1': '0.050', 'AMMO4': '0.055', 'AMMO3': '0.101', 'HITCOUNT': '0.150', 'weapon5': '0.190', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.513', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.464', 'weapon3': '1.792'} +[2023-09-14 15:06:07,223][63770] DAMAGECOUNT value on done: 14687.0 +[2023-09-14 15:06:07,223][63770] Sum rewards: 2.531, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.662', 'AMMO2': '0.014', 'AMMO5': '0.020', 'WEAPON4': '0.050', 'AMMO4': '0.071', 'weapon7': '0.084', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.115', 'weapon4': '0.210', 'WEAPON5': '0.300', 'weapon5': '0.378', 'ARMOR': '0.440', 'WEAPON3': '0.500', 'HITCOUNT': '0.590', 'weapon2': '1.054', 'weapon3': '1.612', 'DAMAGECOUNT': '2.454', 'FRAGCOUNT': '2.500'} +[2023-09-14 15:06:08,195][63771] DAMAGECOUNT value on done: 13356.0 +[2023-09-14 15:06:08,482][63734] DAMAGECOUNT value on done: 17171.0 +[2023-09-14 15:06:08,483][63734] Sum rewards: 1.297, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.156', 'AMMO5': '0.005', 'AMMO2': '0.008', 'weapon5': '0.034', 'WEAPON1': '0.040', 'AMMO4': '0.042', 'WEAPON5': '0.100', 'AMMO3': '0.105', 'HITCOUNT': '0.140', 'ARMOR': '0.502', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.855', 'weapon2': '1.062', 'weapon3': '1.910', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:06:08,596][63771] DAMAGECOUNT value on done: 16716.0 +[2023-09-14 15:06:08,596][63771] Sum rewards: 0.161, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.538', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'ARMOR': '0.024', 'AMMO5': '0.025', 'WEAPON1': '0.070', 'AMMO3': '0.084', 'weapon5': '0.244', 'HITCOUNT': '0.380', 'WEAPON5': '0.500', 'WEAPON3': '0.550', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.290', 'weapon2': '1.394', 'weapon3': '1.896'} +[2023-09-14 15:06:08,874][63734] DAMAGECOUNT value on done: 15343.0 +[2023-09-14 15:06:08,874][63734] Sum rewards: 0.625, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.786', 'AMMO2': '0.011', 'AMMO5': '0.023', 'ARMOR': '0.028', 'weapon5': '0.038', 'AMMO4': '0.057', 'weapon7': '0.068', 'WEAPON1': '0.070', 'WEAPON4': '0.100', 'AMMO3': '0.104', 'weapon4': '0.112', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.170', 'WEAPON7': '0.200', 'WEAPON5': '0.350', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.612', 'FRAGCOUNT': '1.000', 'weapon3': '1.374', 'weapon2': '1.554'} +[2023-09-14 15:06:08,890][63733] Updated weights for policy 1, policy_version 2530 (0.0011) +[2023-09-14 15:06:09,603][63769] DAMAGECOUNT value on done: 15612.0 +[2023-09-14 15:06:09,603][63769] Sum rewards: -0.819, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.850', 'weapon4': '0.004', 'WEAPON1': '0.010', 'AMMO2': '0.017', 'AMMO5': '0.018', 'AMMO4': '0.084', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON4': '0.100', 'weapon7': '0.106', 'HITCOUNT': '0.120', 'AMMO3': '0.125', 'weapon5': '0.256', 'WEAPON5': '0.350', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.681', 'weapon3': '1.436', 'FRAGCOUNT': '1.500', 'weapon2': '1.824'} +[2023-09-14 15:06:09,968][63732] Updated weights for policy 0, policy_version 2320 (0.0011) +[2023-09-14 15:06:09,968][63769] DAMAGECOUNT value on done: 13699.0 +[2023-09-14 15:06:09,969][63769] Sum rewards: -0.606, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.230', 'AMMO2': '0.007', 'WEAPON1': '0.010', 'AMMO5': '0.015', 'ARMOR': '0.021', 'AMMO4': '0.033', 'AMMO3': '0.181', 'weapon5': '0.208', 'WEAPON5': '0.300', 'HITCOUNT': '0.330', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.395', 'weapon2': '1.456', 'weapon3': '1.918', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:06:10,090][63769] DAMAGECOUNT value on done: 18244.0 +[2023-09-14 15:06:10,091][63769] Sum rewards: 0.117, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.214', 'AMMO4': '-0.009', 'AMMO2': '-0.002', 'AMMO5': '0.003', 'WEAPON1': '0.020', 'weapon5': '0.028', 'ARMOR': '0.043', 'WEAPON5': '0.050', 'AMMO3': '0.084', 'WEAPON4': '0.100', 'weapon4': '0.104', 'HITCOUNT': '0.370', 'WEAPON3': '0.650', 'weapon2': '1.258', 'DAMAGECOUNT': '1.452', 'weapon3': '1.930', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:06:10,482][63769] DAMAGECOUNT value on done: 12320.0 +[2023-09-14 15:06:10,482][63769] Sum rewards: -1.110, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.780', 'AMMO5': '0.007', 'AMMO2': '0.034', 'weapon4': '0.042', 'ARMOR': '0.068', 'WEAPON1': '0.070', 'HITCOUNT': '0.120', 'AMMO3': '0.131', 'weapon5': '0.164', 'AMMO4': '0.170', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.246', 'weapon3': '1.832'} +[2023-09-14 15:06:11,246][63735] DAMAGECOUNT value on done: 15353.0 +[2023-09-14 15:06:11,620][63735] DAMAGECOUNT value on done: 12883.0 +[2023-09-14 15:06:11,621][63735] Sum rewards: -2.409, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.442', 'AMMO2': '0.012', 'AMMO5': '0.015', 'weapon7': '0.022', 'AMMO4': '0.057', 'ARMOR': '0.068', 'weapon5': '0.082', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.120', 'HITCOUNT': '0.180', 'WEAPON4': '0.200', 'weapon4': '0.218', 'WEAPON5': '0.300', 'WEAPON3': '0.750', 'weapon2': '1.236', 'DAMAGECOUNT': '1.335', 'weapon3': '1.888', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:06:16,287][63733] Updated weights for policy 1, policy_version 2540 (0.0010) +[2023-09-14 15:06:16,371][63806] DAMAGECOUNT value on done: 14012.0 +[2023-09-14 15:06:16,371][63806] Sum rewards: 0.063, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.308', 'weapon4': '0.002', 'AMMO2': '0.009', 'AMMO5': '0.018', 'ARMOR': '0.024', 'AMMO4': '0.043', 'WEAPON4': '0.050', 'WEAPON1': '0.070', 'AMMO3': '0.095', 'weapon5': '0.240', 'WEAPON5': '0.250', 'HITCOUNT': '0.350', 'WEAPON3': '0.500', 'weapon3': '1.236', 'DAMAGECOUNT': '1.305', 'weapon2': '1.680', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:06:16,739][63806] DAMAGECOUNT value on done: 15275.0 +[2023-09-14 15:06:16,739][63806] Sum rewards: 2.346, reward structure: {'DEATHCOUNT': '-3.000', 'HEALTH': '-0.487', 'AMMO5': '0.005', 'AMMO2': '0.005', 'weapon4': '0.010', 'AMMO4': '0.027', 'AMMO3': '0.040', 'WEAPON4': '0.050', 'WEAPON1': '0.070', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'weapon7': '0.118', 'WEAPON5': '0.150', 'HITCOUNT': '0.170', 'weapon5': '0.278', 'WEAPON3': '0.300', 'DAMAGECOUNT': '0.426', 'FRAGCOUNT': '1.000', 'weapon3': '1.152', 'weapon2': '1.732'} +[2023-09-14 15:06:17,432][63732] Updated weights for policy 0, policy_version 2330 (0.0011) +[2023-09-14 15:06:19,190][63805] DAMAGECOUNT value on done: 16181.0 +[2023-09-14 15:06:19,190][63805] Sum rewards: -1.101, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-0.120', 'AMMO2': '0.001', 'AMMO4': '0.006', 'AMMO5': '0.006', 'ARMOR': '0.016', 'weapon7': '0.052', 'weapon5': '0.058', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.150', 'AMMO3': '0.156', 'HITCOUNT': '0.300', 'WEAPON3': '0.900', 'weapon2': '1.406', 'DAMAGECOUNT': '1.530', 'weapon3': '2.138', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:06:19,635][63805] DAMAGECOUNT value on done: 14204.0 +[2023-09-14 15:06:20,709][63735] DAMAGECOUNT value on done: 13679.0 +[2023-09-14 15:06:20,709][63735] Sum rewards: -0.019, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.270', 'AMMO4': '-0.046', 'AMMO2': '-0.009', 'AMMO5': '0.014', 'ARMOR': '0.040', 'weapon7': '0.052', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon5': '0.140', 'AMMO3': '0.148', 'WEAPON7': '0.200', 'weapon4': '0.206', 'HITCOUNT': '0.230', 'WEAPON5': '0.350', 'WEAPON3': '0.950', 'weapon2': '0.996', 'DAMAGECOUNT': '1.272', 'weapon3': '2.118', 'FRAGCOUNT': '3.500'} +[2023-09-14 15:06:21,109][63735] DAMAGECOUNT value on done: 18359.0 +[2023-09-14 15:06:21,110][63735] Sum rewards: 0.028, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.086', 'AMMO2': '0.020', 'AMMO5': '0.025', 'WEAPON1': '0.030', 'weapon4': '0.036', 'weapon5': '0.060', 'ARMOR': '0.078', 'AMMO3': '0.098', 'AMMO4': '0.101', 'WEAPON4': '0.250', 'WEAPON5': '0.400', 'HITCOUNT': '0.410', 'WEAPON3': '0.500', 'weapon3': '1.436', 'DAMAGECOUNT': '1.665', 'weapon2': '2.004', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:06:23,657][63805] DAMAGECOUNT value on done: 16070.0 +[2023-09-14 15:06:23,658][63805] Sum rewards: -0.064, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.280', 'AMMO5': '0.007', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'weapon5': '0.024', 'ARMOR': '0.032', 'AMMO4': '0.088', 'AMMO3': '0.106', 'weapon4': '0.114', 'HITCOUNT': '0.120', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'DAMAGECOUNT': '0.324', 'WEAPON3': '0.600', 'weapon2': '1.166', 'FRAGCOUNT': '2.000', 'weapon3': '2.046'} +[2023-09-14 15:06:23,705][63733] Updated weights for policy 1, policy_version 2550 (0.0010) +[2023-09-14 15:06:23,859][63734] DAMAGECOUNT value on done: 14785.0 +[2023-09-14 15:06:23,860][63734] Sum rewards: -2.748, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.846', 'AMMO5': '0.009', 'AMMO2': '0.032', 'WEAPON1': '0.050', 'AMMO3': '0.081', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO4': '0.159', 'weapon4': '0.176', 'WEAPON5': '0.200', 'weapon5': '0.208', 'HITCOUNT': '0.260', 'WEAPON4': '0.300', 'WEAPON3': '0.400', 'FRAGCOUNT': '0.500', 'ARMOR': '0.522', 'weapon3': '0.974', 'DAMAGECOUNT': '1.065', 'weapon2': '1.862'} +[2023-09-14 15:06:24,020][63805] DAMAGECOUNT value on done: 17698.0 +[2023-09-14 15:06:24,021][63805] Sum rewards: -4.003, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.350', 'ARMOR': '0.008', 'AMMO5': '0.013', 'AMMO2': '0.023', 'weapon7': '0.048', 'WEAPON1': '0.060', 'weapon4': '0.074', 'AMMO3': '0.075', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO4': '0.115', 'weapon5': '0.136', 'HITCOUNT': '0.240', 'WEAPON5': '0.250', 'WEAPON4': '0.250', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.879', 'FRAGCOUNT': '1.000', 'weapon3': '1.482', 'weapon2': '1.594'} +[2023-09-14 15:06:24,213][63806] DAMAGECOUNT value on done: 14727.0 +[2023-09-14 15:06:24,214][63806] Sum rewards: -6.119, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.172', 'AMMO5': '0.013', 'weapon5': '0.014', 'AMMO2': '0.023', 'weapon4': '0.032', 'WEAPON1': '0.040', 'ARMOR': '0.101', 'AMMO4': '0.114', 'AMMO3': '0.158', 'HITCOUNT': '0.180', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.507', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.162', 'weapon3': '2.310'} +[2023-09-14 15:06:24,265][63734] DAMAGECOUNT value on done: 14810.0 +[2023-09-14 15:06:24,266][63734] Sum rewards: 1.240, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.036', 'AMMO2': '0.005', 'AMMO5': '0.022', 'AMMO4': '0.026', 'ARMOR': '0.036', 'WEAPON1': '0.050', 'WEAPON4': '0.050', 'weapon4': '0.052', 'weapon5': '0.068', 'AMMO3': '0.169', 'HITCOUNT': '0.290', 'WEAPON5': '0.450', 'weapon2': '0.860', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.401', 'weapon3': '2.396', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:06:24,648][63806] DAMAGECOUNT value on done: 15236.0 +[2023-09-14 15:06:24,648][63806] Sum rewards: 0.732, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.166', 'AMMO5': '0.010', 'AMMO2': '0.021', 'WEAPON1': '0.040', 'AMMO4': '0.106', 'AMMO3': '0.140', 'WEAPON5': '0.200', 'HITCOUNT': '0.300', 'weapon5': '0.360', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.119', 'weapon3': '1.372', 'weapon2': '1.730', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:06:24,887][63732] Updated weights for policy 0, policy_version 2340 (0.0010) +[2023-09-14 15:06:26,664][63771] DAMAGECOUNT value on done: 15470.0 +[2023-09-14 15:06:27,047][63767] DAMAGECOUNT value on done: 17672.0 +[2023-09-14 15:06:27,047][63767] Sum rewards: -0.626, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.401', 'AMMO5': '0.010', 'AMMO2': '0.013', 'ARMOR': '0.048', 'AMMO4': '0.065', 'weapon5': '0.116', 'AMMO3': '0.131', 'WEAPON5': '0.150', 'HITCOUNT': '0.290', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.230', 'weapon2': '1.292', 'weapon3': '2.330'} +[2023-09-14 15:06:27,091][63771] DAMAGECOUNT value on done: 12212.0 +[2023-09-14 15:06:27,092][63771] Sum rewards: 1.601, reward structure: {'DEATHCOUNT': '-2.250', 'FRAGCOUNT': '-0.500', 'HEALTH': '-0.308', 'AMMO5': '0.007', 'WEAPON1': '0.020', 'AMMO2': '0.024', 'weapon7': '0.048', 'weapon5': '0.054', 'HITCOUNT': '0.080', 'AMMO3': '0.088', 'WEAPON5': '0.100', 'AMMO4': '0.120', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.200', 'WEAPON7': '0.200', 'weapon4': '0.204', 'WEAPON3': '0.250', 'DAMAGECOUNT': '0.411', 'ARMOR': '0.471', 'weapon2': '0.502', 'weapon3': '1.640'} +[2023-09-14 15:06:27,469][63767] DAMAGECOUNT value on done: 16827.0 +[2023-09-14 15:06:27,470][63767] Sum rewards: 1.357, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.682', 'AMMO5': '0.015', 'AMMO2': '0.022', 'WEAPON1': '0.050', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'weapon7': '0.100', 'AMMO3': '0.104', 'AMMO4': '0.107', 'weapon5': '0.172', 'WEAPON5': '0.200', 'HITCOUNT': '0.220', 'weapon4': '0.220', 'WEAPON4': '0.250', 'ARMOR': '0.424', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.795', 'weapon2': '0.978', 'weapon3': '2.032', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:06:27,475][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002343_9596928.pth... +[2023-09-14 15:06:27,475][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000002554_10461184.pth... +[2023-09-14 15:06:27,535][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000002155_8826880.pth +[2023-09-14 15:06:27,539][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002092_8568832.pth +[2023-09-14 15:06:30,131][63767] DAMAGECOUNT value on done: 17453.0 +[2023-09-14 15:06:30,131][63767] Sum rewards: -1.779, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.929', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.003', 'WEAPON1': '0.010', 'weapon5': '0.038', 'ARMOR': '0.044', 'WEAPON5': '0.050', 'weapon7': '0.050', 'AMMO3': '0.102', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.160', 'WEAPON7': '0.200', 'WEAPON4': '0.250', 'weapon4': '0.382', 'DAMAGECOUNT': '0.573', 'WEAPON3': '0.750', 'weapon2': '0.806', 'FRAGCOUNT': '1.000', 'weapon3': '1.498'} +[2023-09-14 15:06:30,534][63767] DAMAGECOUNT value on done: 19110.0 +[2023-09-14 15:06:30,534][63767] Sum rewards: -0.990, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.696', 'AMMO5': '0.017', 'AMMO2': '0.019', 'weapon4': '0.044', 'ARMOR': '0.048', 'WEAPON1': '0.050', 'AMMO4': '0.097', 'AMMO3': '0.115', 'HITCOUNT': '0.180', 'weapon5': '0.194', 'WEAPON4': '0.200', 'WEAPON5': '0.350', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.747', 'weapon3': '1.598', 'weapon2': '1.646', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:06:31,492][63733] Updated weights for policy 1, policy_version 2560 (0.0010) +[2023-09-14 15:06:31,887][63770] DAMAGECOUNT value on done: 14456.0 +[2023-09-14 15:06:31,888][63770] Sum rewards: -0.462, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO2': '0.027', 'WEAPON4': '0.050', 'ARMOR': '0.088', 'AMMO4': '0.134', 'AMMO3': '0.151', 'weapon4': '0.190', 'HITCOUNT': '0.370', 'HEALTH': '0.622', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'DAMAGECOUNT': '1.068', 'weapon2': '1.340', 'weapon3': '2.098'} +[2023-09-14 15:06:32,277][63770] DAMAGECOUNT value on done: 15474.0 +[2023-09-14 15:06:32,277][63770] Sum rewards: -3.823, reward structure: {'DEATHCOUNT': '-10.500', 'AMMO5': '0.020', 'AMMO2': '0.022', 'weapon4': '0.034', 'ARMOR': '0.040', 'WEAPON1': '0.040', 'weapon5': '0.078', 'HITCOUNT': '0.100', 'WEAPON4': '0.100', 'AMMO4': '0.109', 'AMMO3': '0.120', 'HEALTH': '0.280', 'DAMAGECOUNT': '0.390', 'WEAPON5': '0.400', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.532', 'weapon3': '1.812'} +[2023-09-14 15:06:32,362][63770] DAMAGECOUNT value on done: 16704.0 +[2023-09-14 15:06:32,362][63770] Sum rewards: -0.902, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.808', 'ARMOR': '0.008', 'AMMO5': '0.022', 'AMMO2': '0.031', 'WEAPON1': '0.050', 'weapon4': '0.058', 'AMMO3': '0.115', 'AMMO4': '0.155', 'HITCOUNT': '0.200', 'weapon5': '0.224', 'WEAPON5': '0.300', 'WEAPON4': '0.300', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.900', 'weapon2': '1.272', 'weapon3': '1.820', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:06:32,590][63732] Updated weights for policy 0, policy_version 2350 (0.0011) +[2023-09-14 15:06:32,749][63770] DAMAGECOUNT value on done: 15249.0 +[2023-09-14 15:06:32,749][63770] Sum rewards: 1.532, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.478', 'AMMO2': '0.008', 'weapon4': '0.010', 'AMMO5': '0.014', 'weapon5': '0.034', 'AMMO4': '0.039', 'WEAPON4': '0.050', 'WEAPON1': '0.060', 'AMMO3': '0.122', 'HITCOUNT': '0.300', 'WEAPON5': '0.300', 'ARMOR': '0.432', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.500', 'weapon2': '1.550', 'DAMAGECOUNT': '1.665', 'weapon3': '1.976'} +[2023-09-14 15:06:32,931][63769] DAMAGECOUNT value on done: 15695.0 +[2023-09-14 15:06:33,327][63769] DAMAGECOUNT value on done: 13948.0 +[2023-09-14 15:06:33,328][63769] Sum rewards: -6.397, reward structure: {'DEATHCOUNT': '-10.500', 'FRAGCOUNT': '-1.500', 'HEALTH': '-0.152', 'ARMOR': '0.008', 'AMMO2': '0.013', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.067', 'weapon5': '0.112', 'HITCOUNT': '0.180', 'AMMO3': '0.191', 'WEAPON5': '0.300', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.747', 'weapon2': '1.588', 'weapon3': '1.914'} +[2023-09-14 15:06:33,813][63771] DAMAGECOUNT value on done: 13702.0 +[2023-09-14 15:06:33,814][63771] Sum rewards: 1.159, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.454', 'AMMO5': '0.010', 'AMMO2': '0.011', 'WEAPON1': '0.030', 'AMMO4': '0.055', 'weapon7': '0.076', 'AMMO3': '0.097', 'AMMO6': '0.120', 'AMMO7': '0.120', 'WEAPON4': '0.150', 'WEAPON5': '0.200', 'WEAPON7': '0.200', 'weapon4': '0.220', 'HITCOUNT': '0.240', 'ARMOR': '0.620', 'WEAPON3': '0.700', 'DAMAGECOUNT': '1.038', 'weapon2': '1.400', 'weapon3': '1.826', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:06:34,069][63734] DAMAGECOUNT value on done: 17425.0 +[2023-09-14 15:06:34,069][63734] Sum rewards: 1.694, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.170', 'AMMO5': '0.005', 'AMMO2': '0.009', 'AMMO4': '0.046', 'AMMO3': '0.118', 'HITCOUNT': '0.120', 'WEAPON5': '0.150', 'weapon5': '0.168', 'ARMOR': '0.416', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.762', 'weapon2': '1.272', 'weapon3': '1.548', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:06:34,193][63771] DAMAGECOUNT value on done: 16958.0 +[2023-09-14 15:06:34,194][63771] Sum rewards: -1.688, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.017', 'AMMO2': '0.016', 'weapon4': '0.016', 'AMMO5': '0.028', 'ARMOR': '0.040', 'weapon5': '0.074', 'AMMO4': '0.078', 'WEAPON1': '0.090', 'AMMO3': '0.102', 'WEAPON4': '0.150', 'HITCOUNT': '0.180', 'WEAPON5': '0.550', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.726', 'FRAGCOUNT': '1.000', 'weapon2': '1.320', 'weapon3': '1.810'} +[2023-09-14 15:06:34,475][63734] DAMAGECOUNT value on done: 15463.0 +[2023-09-14 15:06:34,573][63770] Large shaping reward 2.614 for [('FRAGCOUNT', 2.0, 2.0), ('HITCOUNT', 0.03, 3.0), ('DAMAGECOUNT', 0.582, 194.0), ('weapon7', 0.002)] +[2023-09-14 15:06:35,610][63769] DAMAGECOUNT value on done: 18427.0 +[2023-09-14 15:06:35,610][63769] Sum rewards: -1.440, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.668', 'AMMO2': '0.009', 'AMMO5': '0.024', 'WEAPON1': '0.030', 'AMMO4': '0.047', 'WEAPON4': '0.050', 'weapon5': '0.060', 'weapon7': '0.070', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'ARMOR': '0.104', 'HITCOUNT': '0.130', 'AMMO3': '0.137', 'weapon4': '0.202', 'WEAPON5': '0.500', 'DAMAGECOUNT': '0.549', 'WEAPON3': '0.750', 'weapon2': '0.972', 'weapon3': '1.544', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:06:36,019][63769] DAMAGECOUNT value on done: 12486.0 +[2023-09-14 15:06:36,019][63769] Sum rewards: -2.940, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.348', 'weapon4': '0.006', 'AMMO5': '0.013', 'AMMO2': '0.034', 'weapon5': '0.058', 'WEAPON1': '0.080', 'AMMO3': '0.106', 'HITCOUNT': '0.140', 'AMMO4': '0.167', 'WEAPON5': '0.250', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.498', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.570', 'weapon3': '1.786'} +[2023-09-14 15:06:36,490][63735] DAMAGECOUNT value on done: 15522.0 +[2023-09-14 15:06:36,490][63735] Sum rewards: -3.746, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-2.560', 'weapon4': '0.002', 'AMMO2': '0.015', 'AMMO5': '0.025', 'AMMO4': '0.076', 'WEAPON1': '0.080', 'HITCOUNT': '0.120', 'AMMO3': '0.143', 'WEAPON4': '0.200', 'weapon5': '0.314', 'WEAPON5': '0.400', 'DAMAGECOUNT': '0.507', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.378', 'weapon3': '1.404'} +[2023-09-14 15:06:36,883][63735] DAMAGECOUNT value on done: 13097.0 +[2023-09-14 15:06:36,883][63735] Sum rewards: -4.025, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.143', 'AMMO2': '0.006', 'AMMO5': '0.012', 'weapon7': '0.016', 'AMMO4': '0.030', 'ARMOR': '0.044', 'WEAPON4': '0.050', 'WEAPON1': '0.050', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'AMMO3': '0.118', 'weapon4': '0.134', 'HITCOUNT': '0.180', 'weapon5': '0.248', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.642', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon2': '1.016', 'weapon3': '2.022'} +[2023-09-14 15:06:38,913][63733] Updated weights for policy 1, policy_version 2570 (0.0010) +[2023-09-14 15:06:40,126][63732] Updated weights for policy 0, policy_version 2360 (0.0011) +[2023-09-14 15:06:41,007][63806] DAMAGECOUNT value on done: 14431.0 +[2023-09-14 15:06:41,008][63806] Sum rewards: 2.199, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.406', 'weapon4': '0.012', 'AMMO5': '0.012', 'AMMO2': '0.021', 'ARMOR': '0.036', 'WEAPON1': '0.070', 'WEAPON4': '0.100', 'AMMO4': '0.103', 'AMMO3': '0.130', 'HITCOUNT': '0.210', 'weapon5': '0.266', 'WEAPON5': '0.300', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.257', 'weapon3': '1.474', 'weapon2': '1.614', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:06:41,426][63806] DAMAGECOUNT value on done: 15694.0 +[2023-09-14 15:06:41,427][63806] Sum rewards: 0.776, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.754', 'AMMO2': '0.004', 'AMMO5': '0.007', 'weapon5': '0.018', 'WEAPON1': '0.020', 'AMMO4': '0.022', 'ARMOR': '0.044', 'AMMO3': '0.119', 'WEAPON5': '0.150', 'HITCOUNT': '0.350', 'WEAPON3': '0.750', 'DAMAGECOUNT': '1.257', 'weapon2': '1.440', 'weapon3': '1.848', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:06:44,518][63805] DAMAGECOUNT value on done: 16446.0 +[2023-09-14 15:06:44,518][63805] Sum rewards: 1.940, reward structure: {'DEATHCOUNT': '-5.250', 'AMMO5': '0.003', 'AMMO2': '0.007', 'WEAPON1': '0.010', 'AMMO4': '0.034', 'WEAPON5': '0.050', 'WEAPON4': '0.050', 'AMMO3': '0.091', 'weapon4': '0.100', 'HEALTH': '0.104', 'weapon5': '0.168', 'HITCOUNT': '0.260', 'WEAPON3': '0.450', 'ARMOR': '0.452', 'DAMAGECOUNT': '0.795', 'weapon3': '1.140', 'weapon2': '1.476', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:06:44,986][63805] DAMAGECOUNT value on done: 14330.0 +[2023-09-14 15:06:45,908][63735] DAMAGECOUNT value on done: 13940.0 +[2023-09-14 15:06:45,909][63735] Sum rewards: -2.594, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.390', 'AMMO5': '0.015', 'AMMO2': '0.019', 'WEAPON1': '0.030', 'ARMOR': '0.040', 'weapon5': '0.064', 'AMMO4': '0.096', 'weapon4': '0.164', 'AMMO3': '0.178', 'WEAPON4': '0.200', 'WEAPON5': '0.250', 'HITCOUNT': '0.280', 'DAMAGECOUNT': '0.783', 'WEAPON3': '1.100', 'weapon2': '1.532', 'weapon3': '1.794', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:06:46,357][63733] Updated weights for policy 1, policy_version 2580 (0.0011) +[2023-09-14 15:06:46,358][63735] DAMAGECOUNT value on done: 18504.0 +[2023-09-14 15:06:46,359][63735] Sum rewards: -3.299, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.871', 'weapon4': '0.002', 'AMMO5': '0.015', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'ARMOR': '0.064', 'AMMO4': '0.092', 'WEAPON4': '0.100', 'HITCOUNT': '0.110', 'weapon5': '0.116', 'AMMO3': '0.166', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.800', 'weapon3': '1.512', 'weapon2': '1.572', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:06:46,664][63806] DAMAGECOUNT value on done: 14995.0 +[2023-09-14 15:06:46,665][63806] Sum rewards: -4.164, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.438', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO2': '0.039', 'weapon4': '0.040', 'AMMO3': '0.116', 'AMMO4': '0.195', 'HITCOUNT': '0.230', 'WEAPON5': '0.250', 'WEAPON4': '0.300', 'weapon5': '0.388', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.804', 'FRAGCOUNT': '1.000', 'weapon3': '1.024', 'weapon2': '2.002'} +[2023-09-14 15:06:46,808][63805] DAMAGECOUNT value on done: 16119.0 +[2023-09-14 15:06:46,991][63806] DAMAGECOUNT value on done: 15526.0 +[2023-09-14 15:06:46,992][63806] Sum rewards: -1.489, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.296', 'AMMO5': '0.018', 'AMMO2': '0.023', 'WEAPON1': '0.060', 'weapon4': '0.060', 'weapon5': '0.084', 'AMMO4': '0.113', 'AMMO3': '0.119', 'WEAPON4': '0.150', 'HITCOUNT': '0.260', 'WEAPON5': '0.350', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.870', 'weapon2': '1.430', 'weapon3': '1.670', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:06:47,198][63805] DAMAGECOUNT value on done: 18010.0 +[2023-09-14 15:06:47,198][63805] Sum rewards: -3.945, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.980', 'AMMO2': '0.006', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.031', 'weapon4': '0.062', 'AMMO3': '0.135', 'WEAPON4': '0.150', 'weapon5': '0.160', 'HITCOUNT': '0.230', 'WEAPON5': '0.250', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.936', 'weapon3': '1.308', 'weapon2': '1.832', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:06:47,633][63732] Updated weights for policy 0, policy_version 2370 (0.0011) +[2023-09-14 15:06:49,678][63734] DAMAGECOUNT value on done: 14977.0 +[2023-09-14 15:06:49,678][63734] Sum rewards: 0.710, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.831', 'AMMO5': '0.015', 'AMMO2': '0.027', 'WEAPON1': '0.060', 'weapon4': '0.062', 'WEAPON4': '0.100', 'AMMO3': '0.102', 'AMMO4': '0.133', 'weapon5': '0.160', 'HITCOUNT': '0.170', 'WEAPON5': '0.300', 'ARMOR': '0.474', 'DAMAGECOUNT': '0.576', 'WEAPON3': '0.650', 'weapon2': '1.406', 'weapon3': '1.556', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:06:50,006][63767] DAMAGECOUNT value on done: 17924.0 +[2023-09-14 15:06:50,007][63767] Sum rewards: -1.667, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.320', 'AMMO2': '0.002', 'AMMO4': '0.010', 'AMMO5': '0.020', 'WEAPON1': '0.020', 'ARMOR': '0.024', 'weapon4': '0.046', 'weapon7': '0.086', 'WEAPON4': '0.100', 'AMMO3': '0.120', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.140', 'WEAPON7': '0.200', 'WEAPON5': '0.350', 'weapon5': '0.444', 'FRAGCOUNT': '0.500', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.756', 'weapon2': '1.272', 'weapon3': '1.372'} +[2023-09-14 15:06:50,076][63734] DAMAGECOUNT value on done: 15062.0 +[2023-09-14 15:06:50,076][63734] Sum rewards: -3.423, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.494', 'AMMO5': '0.005', 'WEAPON1': '0.010', 'AMMO2': '0.014', 'ARMOR': '0.048', 'weapon5': '0.066', 'AMMO4': '0.068', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon4': '0.118', 'AMMO3': '0.136', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.756', 'weapon3': '1.614', 'weapon2': '1.746', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:06:50,332][63767] DAMAGECOUNT value on done: 17117.0 +[2023-09-14 15:06:50,332][63767] Sum rewards: -2.233, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.006', 'AMMO2': '0.010', 'AMMO5': '0.015', 'WEAPON1': '0.020', 'AMMO4': '0.050', 'weapon5': '0.076', 'WEAPON4': '0.100', 'weapon4': '0.130', 'AMMO3': '0.136', 'AMMO6': '0.220', 'AMMO7': '0.220', 'weapon7': '0.220', 'HITCOUNT': '0.240', 'WEAPON5': '0.250', 'WEAPON7': '0.300', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.870', 'FRAGCOUNT': '1.000', 'weapon3': '1.522', 'weapon2': '1.644'} +[2023-09-14 15:06:52,378][63771] DAMAGECOUNT value on done: 15710.0 +[2023-09-14 15:06:52,378][63771] Sum rewards: 0.478, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.007', 'weapon4': '0.008', 'AMMO2': '0.022', 'WEAPON1': '0.030', 'ARMOR': '0.032', 'WEAPON4': '0.050', 'AMMO4': '0.109', 'AMMO3': '0.126', 'WEAPON5': '0.150', 'weapon5': '0.150', 'HITCOUNT': '0.170', 'HEALTH': '0.296', 'WEAPON3': '0.450', 'DAMAGECOUNT': '0.720', 'FRAGCOUNT': '1.000', 'weapon3': '1.064', 'weapon2': '2.094'} +[2023-09-14 15:06:52,782][63771] DAMAGECOUNT value on done: 12397.0 +[2023-09-14 15:06:52,782][63771] Sum rewards: -2.187, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.596', 'AMMO4': '-0.025', 'AMMO2': '-0.005', 'weapon7': '0.002', 'AMMO5': '0.005', 'WEAPON1': '0.030', 'weapon4': '0.034', 'WEAPON4': '0.050', 'ARMOR': '0.064', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'HITCOUNT': '0.120', 'AMMO3': '0.141', 'WEAPON5': '0.150', 'weapon5': '0.192', 'DAMAGECOUNT': '0.555', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.220', 'weapon3': '2.126'} +[2023-09-14 15:06:53,892][63733] Updated weights for policy 1, policy_version 2590 (0.0011) +[2023-09-14 15:06:55,170][63732] Updated weights for policy 0, policy_version 2380 (0.0010) +[2023-09-14 15:06:55,219][63767] DAMAGECOUNT value on done: 17826.0 +[2023-09-14 15:06:55,219][63767] Sum rewards: 2.715, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO2': '0.012', 'AMMO5': '0.012', 'ARMOR': '0.024', 'WEAPON1': '0.040', 'WEAPON4': '0.050', 'HEALTH': '0.057', 'AMMO4': '0.059', 'weapon5': '0.080', 'weapon4': '0.120', 'WEAPON5': '0.150', 'AMMO3': '0.166', 'HITCOUNT': '0.250', 'WEAPON3': '0.700', 'weapon2': '0.920', 'DAMAGECOUNT': '1.119', 'weapon3': '1.706', 'FRAGCOUNT': '4.000'} +[2023-09-14 15:06:55,338][63734] Large shaping reward 2.632 for [('FRAGCOUNT', 2.0, 2.0), ('HITCOUNT', 0.03, 3.0), ('DAMAGECOUNT', 0.6, 200), ('weapon7', 0.002)] +[2023-09-14 15:06:55,606][63767] DAMAGECOUNT value on done: 19357.0 +[2023-09-14 15:06:55,607][63767] Sum rewards: -5.028, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.122', 'AMMO5': '0.016', 'weapon4': '0.018', 'AMMO2': '0.020', 'ARMOR': '0.035', 'weapon5': '0.040', 'WEAPON1': '0.050', 'AMMO4': '0.098', 'WEAPON4': '0.150', 'AMMO3': '0.206', 'HITCOUNT': '0.210', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.741', 'WEAPON3': '1.050', 'weapon2': '1.056', 'FRAGCOUNT': '2.000', 'weapon3': '2.054'} +[2023-09-14 15:06:56,059][63769] DAMAGECOUNT value on done: 15795.0 +[2023-09-14 15:06:56,060][63769] Sum rewards: 1.602, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.555', 'weapon4': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.011', 'AMMO5': '0.017', 'ARMOR': '0.032', 'AMMO4': '0.056', 'AMMO3': '0.066', 'WEAPON4': '0.100', 'HITCOUNT': '0.120', 'weapon5': '0.204', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.300', 'WEAPON3': '0.450', 'weapon3': '1.328', 'weapon2': '1.702', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:06:56,367][63769] DAMAGECOUNT value on done: 13998.0 +[2023-09-14 15:06:57,475][63770] DAMAGECOUNT value on done: 14965.0 +[2023-09-14 15:06:57,475][63770] Sum rewards: 0.965, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-0.996', 'AMMO2': '0.001', 'AMMO4': '0.007', 'AMMO5': '0.010', 'WEAPON1': '0.030', 'weapon7': '0.062', 'ARMOR': '0.072', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.107', 'weapon5': '0.162', 'HITCOUNT': '0.180', 'WEAPON3': '0.650', 'weapon3': '1.358', 'DAMAGECOUNT': '1.527', 'weapon2': '1.894', 'FRAGCOUNT': '6.000'} +[2023-09-14 15:06:57,896][63770] DAMAGECOUNT value on done: 15698.0 +[2023-09-14 15:06:57,983][63770] DAMAGECOUNT value on done: 17225.0 +[2023-09-14 15:06:57,984][63770] Sum rewards: 3.121, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.065', 'weapon4': '0.002', 'AMMO5': '0.017', 'AMMO2': '0.023', 'ARMOR': '0.032', 'WEAPON1': '0.080', 'WEAPON4': '0.100', 'AMMO3': '0.112', 'AMMO4': '0.116', 'weapon5': '0.126', 'WEAPON5': '0.350', 'HITCOUNT': '0.410', 'WEAPON3': '0.700', 'weapon2': '1.306', 'DAMAGECOUNT': '1.563', 'weapon3': '1.998', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:06:58,379][63770] DAMAGECOUNT value on done: 15585.0 +[2023-09-14 15:06:58,380][63770] Sum rewards: -4.740, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-0.960', 'AMMO2': '0.012', 'AMMO5': '0.015', 'WEAPON1': '0.030', 'AMMO4': '0.059', 'weapon5': '0.082', 'WEAPON4': '0.100', 'AMMO6': '0.100', 'WEAPON7': '0.100', 'AMMO7': '0.100', 'weapon4': '0.166', 'AMMO3': '0.182', 'HITCOUNT': '0.240', 'WEAPON5': '0.300', 'WEAPON3': '1.000', 'DAMAGECOUNT': '1.008', 'weapon2': '1.376', 'FRAGCOUNT': '2.000', 'weapon3': '2.100'} +[2023-09-14 15:06:59,344][63771] DAMAGECOUNT value on done: 13856.0 +[2023-09-14 15:06:59,345][63771] Sum rewards: -4.963, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-2.154', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.010', 'weapon4': '0.026', 'weapon7': '0.048', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon5': '0.144', 'HITCOUNT': '0.180', 'AMMO3': '0.184', 'WEAPON7': '0.200', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.462', 'WEAPON3': '1.100', 'weapon2': '1.708', 'weapon3': '1.794', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:06:59,610][63734] DAMAGECOUNT value on done: 17770.0 +[2023-09-14 15:06:59,610][63734] Sum rewards: -3.648, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.698', 'FRAGCOUNT': '-1.000', 'AMMO2': '0.007', 'AMMO5': '0.028', 'AMMO4': '0.034', 'WEAPON1': '0.040', 'AMMO3': '0.132', 'weapon5': '0.238', 'HITCOUNT': '0.290', 'WEAPON5': '0.450', 'WEAPON3': '0.900', 'DAMAGECOUNT': '1.035', 'weapon2': '1.118', 'weapon3': '2.278'} +[2023-09-14 15:06:59,739][63771] DAMAGECOUNT value on done: 17309.0 +[2023-09-14 15:06:59,740][63771] Sum rewards: -3.519, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.108', 'AMMO2': '0.011', 'AMMO5': '0.012', 'weapon4': '0.024', 'WEAPON1': '0.030', 'ARMOR': '0.032', 'AMMO4': '0.052', 'weapon5': '0.060', 'WEAPON4': '0.100', 'AMMO3': '0.179', 'WEAPON5': '0.250', 'HITCOUNT': '0.280', 'weapon2': '0.928', 'WEAPON3': '0.950', 'DAMAGECOUNT': '1.053', 'weapon3': '2.378', 'FRAGCOUNT': '2.500'} +[2023-09-14 15:07:00,038][63734] DAMAGECOUNT value on done: 15859.0 +[2023-09-14 15:07:00,038][63734] Sum rewards: -1.141, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-0.736', 'AMMO2': '0.014', 'AMMO5': '0.022', 'WEAPON1': '0.040', 'AMMO4': '0.071', 'AMMO3': '0.147', 'weapon5': '0.260', 'HITCOUNT': '0.340', 'WEAPON5': '0.400', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.188', 'weapon2': '1.490', 'weapon3': '1.822', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:07:00,930][63769] DAMAGECOUNT value on done: 18557.0 +[2023-09-14 15:07:00,930][63769] Sum rewards: -1.539, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.831', 'AMMO2': '0.001', 'AMMO5': '0.005', 'AMMO4': '0.006', 'ARMOR': '0.032', 'WEAPON1': '0.040', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'AMMO3': '0.136', 'weapon4': '0.194', 'weapon5': '0.224', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.650', 'FRAGCOUNT': '1.000', 'weapon2': '1.020', 'weapon3': '2.054'} +[2023-09-14 15:07:01,332][63769] DAMAGECOUNT value on done: 12616.0 +[2023-09-14 15:07:01,399][63733] Updated weights for policy 1, policy_version 2600 (0.0011) +[2023-09-14 15:07:01,679][63735] DAMAGECOUNT value on done: 15844.0 +[2023-09-14 15:07:01,680][63735] Sum rewards: -1.602, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.764', 'AMMO5': '0.012', 'AMMO2': '0.021', 'WEAPON1': '0.060', 'AMMO4': '0.105', 'AMMO3': '0.113', 'WEAPON5': '0.250', 'HITCOUNT': '0.260', 'weapon5': '0.272', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.966', 'weapon3': '1.424', 'weapon2': '1.878', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:07:02,134][63735] DAMAGECOUNT value on done: 13383.0 +[2023-09-14 15:07:02,135][63735] Sum rewards: -6.650, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.484', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.012', 'AMMO5': '0.015', 'ARMOR': '0.044', 'WEAPON1': '0.050', 'AMMO4': '0.061', 'weapon5': '0.112', 'WEAPON4': '0.150', 'weapon4': '0.220', 'AMMO3': '0.239', 'HITCOUNT': '0.240', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.858', 'weapon2': '0.972', 'WEAPON3': '1.150', 'weapon3': '2.110'} +[2023-09-14 15:07:02,679][63732] Updated weights for policy 0, policy_version 2390 (0.0010) +[2023-09-14 15:07:05,450][63806] DAMAGECOUNT value on done: 14567.0 +[2023-09-14 15:07:05,451][63806] Sum rewards: -1.686, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.218', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'ARMOR': '0.016', 'AMMO2': '0.035', 'AMMO3': '0.091', 'weapon4': '0.112', 'WEAPON5': '0.150', 'weapon5': '0.158', 'HITCOUNT': '0.160', 'AMMO4': '0.173', 'WEAPON4': '0.350', 'DAMAGECOUNT': '0.408', 'WEAPON3': '0.500', 'weapon2': '1.252', 'weapon3': '1.610', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:07:05,888][63806] DAMAGECOUNT value on done: 15826.0 +[2023-09-14 15:07:05,889][63806] Sum rewards: -2.416, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.030', 'FRAGCOUNT': '-0.500', 'AMMO2': '0.012', 'AMMO5': '0.017', 'WEAPON1': '0.060', 'AMMO4': '0.061', 'HITCOUNT': '0.090', 'AMMO3': '0.157', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.396', 'weapon5': '0.398', 'ARMOR': '0.524', 'WEAPON3': '0.800', 'weapon2': '1.012', 'weapon3': '2.086'} +[2023-09-14 15:07:08,778][63733] Updated weights for policy 1, policy_version 2610 (0.0012) +[2023-09-14 15:07:08,861][63806] DAMAGECOUNT value on done: 15208.0 +[2023-09-14 15:07:08,862][63806] Sum rewards: 2.691, reward structure: {'DEATHCOUNT': '-5.250', 'HEALTH': '-0.121', 'AMMO5': '0.003', 'AMMO2': '0.008', 'weapon4': '0.024', 'WEAPON1': '0.030', 'weapon5': '0.030', 'AMMO4': '0.037', 'WEAPON5': '0.050', 'AMMO3': '0.092', 'WEAPON4': '0.100', 'HITCOUNT': '0.200', 'ARMOR': '0.523', 'WEAPON3': '0.550', 'DAMAGECOUNT': '0.639', 'weapon2': '1.278', 'weapon3': '1.498', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:07:09,182][63806] DAMAGECOUNT value on done: 15746.0 +[2023-09-14 15:07:09,183][63806] Sum rewards: -5.527, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-2.305', 'FRAGCOUNT': '-0.500', 'AMMO4': '-0.023', 'AMMO2': '-0.005', 'weapon4': '0.010', 'AMMO5': '0.018', 'WEAPON1': '0.020', 'ARMOR': '0.064', 'weapon5': '0.092', 'WEAPON4': '0.100', 'AMMO3': '0.138', 'HITCOUNT': '0.240', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.660', 'WEAPON3': '0.750', 'weapon3': '1.514', 'weapon2': '1.700'} +[2023-09-14 15:07:09,562][63805] DAMAGECOUNT value on done: 16429.0 +[2023-09-14 15:07:09,563][63805] Sum rewards: 2.880, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-0.310', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'AMMO2': '0.024', 'weapon4': '0.026', 'WEAPON4': '0.050', 'AMMO3': '0.067', 'weapon5': '0.094', 'WEAPON5': '0.100', 'AMMO4': '0.118', 'HITCOUNT': '0.210', 'WEAPON3': '0.400', 'DAMAGECOUNT': '0.930', 'weapon3': '1.252', 'weapon2': '1.394', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:07:09,650][63805] DAMAGECOUNT value on done: 16653.0 +[2023-09-14 15:07:09,651][63805] Sum rewards: -1.385, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.372', 'AMMO2': '0.003', 'AMMO4': '0.015', 'WEAPON1': '0.020', 'AMMO5': '0.023', 'AMMO3': '0.096', 'WEAPON4': '0.150', 'HITCOUNT': '0.160', 'weapon4': '0.194', 'WEAPON5': '0.400', 'weapon5': '0.456', 'ARMOR': '0.519', 'DAMAGECOUNT': '0.621', 'WEAPON3': '0.650', 'weapon3': '1.456', 'weapon2': '1.474', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:07:09,940][63805] DAMAGECOUNT value on done: 18433.0 +[2023-09-14 15:07:09,941][63805] Sum rewards: 5.488, reward structure: {'DEATHCOUNT': '-6.000', 'AMMO5': '0.007', 'WEAPON1': '0.010', 'AMMO2': '0.027', 'ARMOR': '0.053', 'AMMO3': '0.060', 'weapon4': '0.098', 'AMMO4': '0.132', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'weapon5': '0.232', 'WEAPON3': '0.250', 'HITCOUNT': '0.260', 'HEALTH': '0.895', 'weapon3': '1.152', 'DAMAGECOUNT': '1.269', 'weapon2': '1.742', 'FRAGCOUNT': '5.000'} +[2023-09-14 15:07:10,025][63805] DAMAGECOUNT value on done: 14437.0 +[2023-09-14 15:07:10,107][63732] Updated weights for policy 0, policy_version 2400 (0.0011) +[2023-09-14 15:07:11,177][63735] DAMAGECOUNT value on done: 14120.0 +[2023-09-14 15:07:11,178][63735] Sum rewards: -3.314, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.580', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'AMMO2': '0.029', 'weapon4': '0.030', 'WEAPON4': '0.050', 'ARMOR': '0.108', 'AMMO4': '0.142', 'AMMO3': '0.163', 'WEAPON5': '0.200', 'HITCOUNT': '0.210', 'DAMAGECOUNT': '0.540', 'WEAPON3': '0.950', 'weapon2': '1.638', 'weapon3': '1.926', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:07:11,504][63735] DAMAGECOUNT value on done: 18602.0 +[2023-09-14 15:07:12,773][63767] DAMAGECOUNT value on done: 18054.0 +[2023-09-14 15:07:13,144][63767] DAMAGECOUNT value on done: 17416.0 +[2023-09-14 15:07:13,144][63767] Sum rewards: -3.740, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-2.620', 'AMMO4': '-0.034', 'AMMO2': '-0.007', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'weapon5': '0.046', 'ARMOR': '0.096', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'AMMO3': '0.201', 'weapon4': '0.204', 'HITCOUNT': '0.280', 'DAMAGECOUNT': '0.897', 'WEAPON3': '0.950', 'weapon3': '1.770', 'weapon2': '1.796', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:07:14,999][63734] DAMAGECOUNT value on done: 15262.0 +[2023-09-14 15:07:15,000][63734] Sum rewards: 0.389, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.587', 'AMMO2': '0.013', 'AMMO5': '0.020', 'ARMOR': '0.024', 'weapon4': '0.024', 'weapon5': '0.028', 'AMMO4': '0.063', 'WEAPON1': '0.080', 'AMMO3': '0.083', 'WEAPON4': '0.150', 'HITCOUNT': '0.200', 'WEAPON5': '0.400', 'WEAPON3': '0.600', 'DAMAGECOUNT': '0.855', 'weapon2': '1.520', 'weapon3': '1.666', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:07:15,431][63734] DAMAGECOUNT value on done: 15527.0 +[2023-09-14 15:07:15,432][63734] Sum rewards: 1.074, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.070', 'AMMO2': '0.007', 'AMMO5': '0.011', 'AMMO4': '0.033', 'WEAPON1': '0.040', 'ARMOR': '0.060', 'weapon5': '0.074', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'AMMO3': '0.110', 'weapon7': '0.172', 'HITCOUNT': '0.240', 'WEAPON5': '0.250', 'WEAPON3': '0.650', 'weapon2': '1.050', 'DAMAGECOUNT': '1.350', 'weapon3': '2.046', 'FRAGCOUNT': '2.500'} +[2023-09-14 15:07:16,055][63733] Updated weights for policy 1, policy_version 2620 (0.0011) +[2023-09-14 15:07:17,770][63771] DAMAGECOUNT value on done: 15964.0 +[2023-09-14 15:07:17,770][63771] Sum rewards: -0.462, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.958', 'AMMO2': '0.007', 'AMMO5': '0.012', 'AMMO4': '0.035', 'ARMOR': '0.036', 'WEAPON1': '0.050', 'weapon5': '0.054', 'AMMO3': '0.097', 'WEAPON4': '0.100', 'weapon4': '0.118', 'HITCOUNT': '0.180', 'WEAPON5': '0.250', 'WEAPON3': '0.700', 'DAMAGECOUNT': '0.762', 'FRAGCOUNT': '1.000', 'weapon2': '1.322', 'weapon3': '1.772'} +[2023-09-14 15:07:17,890][63732] Updated weights for policy 0, policy_version 2410 (0.0010) +[2023-09-14 15:07:18,230][63771] DAMAGECOUNT value on done: 12586.0 +[2023-09-14 15:07:18,231][63771] Sum rewards: 0.189, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.180', 'AMMO4': '-0.003', 'AMMO2': '-0.001', 'AMMO5': '0.012', 'WEAPON1': '0.050', 'weapon7': '0.058', 'AMMO3': '0.060', 'AMMO6': '0.100', 'AMMO7': '0.100', 'WEAPON7': '0.100', 'HITCOUNT': '0.110', 'weapon5': '0.168', 'WEAPON5': '0.300', 'WEAPON3': '0.400', 'ARMOR': '0.500', 'DAMAGECOUNT': '0.567', 'weapon3': '1.226', 'weapon2': '1.622', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:07:19,091][63769] DAMAGECOUNT value on done: 15938.0 +[2023-09-14 15:07:19,092][63769] Sum rewards: 0.786, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-1.470', 'AMMO2': '0.001', 'AMMO4': '0.004', 'weapon7': '0.006', 'AMMO5': '0.009', 'WEAPON1': '0.020', 'weapon4': '0.042', 'HITCOUNT': '0.060', 'WEAPON4': '0.100', 'AMMO3': '0.108', 'WEAPON5': '0.150', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'weapon5': '0.268', 'DAMAGECOUNT': '0.429', 'ARMOR': '0.503', 'WEAPON3': '0.700', 'weapon2': '1.510', 'weapon3': '1.746', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:07:19,453][63769] DAMAGECOUNT value on done: 14170.0 +[2023-09-14 15:07:19,453][63769] Sum rewards: -0.249, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.928', 'AMMO4': '-0.013', 'AMMO2': '-0.003', 'AMMO5': '0.012', 'ARMOR': '0.032', 'WEAPON1': '0.040', 'weapon7': '0.066', 'AMMO3': '0.092', 'AMMO6': '0.120', 'AMMO7': '0.120', 'HITCOUNT': '0.130', 'weapon5': '0.142', 'WEAPON7': '0.200', 'WEAPON5': '0.250', 'DAMAGECOUNT': '0.516', 'WEAPON3': '0.600', 'FRAGCOUNT': '1.000', 'weapon2': '1.626', 'weapon3': '1.748'} +[2023-09-14 15:07:20,275][63767] DAMAGECOUNT value on done: 18064.0 +[2023-09-14 15:07:20,276][63767] Sum rewards: -0.090, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.820', 'AMMO4': '-0.007', 'AMMO2': '-0.001', 'AMMO5': '0.020', 'WEAPON1': '0.020', 'WEAPON4': '0.100', 'AMMO3': '0.136', 'HITCOUNT': '0.230', 'weapon5': '0.232', 'WEAPON5': '0.350', 'ARMOR': '0.496', 'DAMAGECOUNT': '0.714', 'WEAPON3': '0.900', 'weapon2': '1.260', 'FRAGCOUNT': '2.000', 'weapon3': '2.030'} +[2023-09-14 15:07:20,679][63767] DAMAGECOUNT value on done: 19457.0 +[2023-09-14 15:07:22,737][63770] DAMAGECOUNT value on done: 15316.0 +[2023-09-14 15:07:22,737][63770] Sum rewards: 0.819, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.197', 'AMMO4': '-0.015', 'AMMO2': '-0.003', 'AMMO5': '0.010', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'AMMO3': '0.121', 'WEAPON5': '0.250', 'weapon5': '0.250', 'HITCOUNT': '0.320', 'WEAPON3': '0.550', 'DAMAGECOUNT': '1.053', 'weapon2': '1.140', 'FRAGCOUNT': '2.000', 'weapon3': '2.034'} +[2023-09-14 15:07:23,121][63733] Updated weights for policy 1, policy_version 2630 (0.0011) +[2023-09-14 15:07:23,169][63770] DAMAGECOUNT value on done: 15938.0 +[2023-09-14 15:07:23,170][63770] Sum rewards: -4.391, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.086', 'AMMO5': '0.007', 'AMMO2': '0.012', 'weapon4': '0.014', 'WEAPON1': '0.040', 'AMMO4': '0.058', 'AMMO3': '0.102', 'WEAPON5': '0.150', 'WEAPON4': '0.150', 'HITCOUNT': '0.220', 'WEAPON3': '0.650', 'DAMAGECOUNT': '0.720', 'FRAGCOUNT': '1.000', 'weapon3': '1.356', 'weapon2': '1.966'} +[2023-09-14 15:07:23,255][63770] DAMAGECOUNT value on done: 17354.0 +[2023-09-14 15:07:23,255][63770] Sum rewards: -1.247, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-0.869', 'AMMO5': '0.010', 'WEAPON1': '0.010', 'AMMO2': '0.031', 'ARMOR': '0.068', 'AMMO3': '0.088', 'weapon4': '0.110', 'HITCOUNT': '0.120', 'weapon5': '0.150', 'AMMO4': '0.154', 'WEAPON5': '0.200', 'WEAPON4': '0.300', 'DAMAGECOUNT': '0.387', 'WEAPON3': '0.400', 'weapon3': '0.716', 'FRAGCOUNT': '2.000', 'weapon2': '2.378'} +[2023-09-14 15:07:23,662][63770] DAMAGECOUNT value on done: 15710.0 +[2023-09-14 15:07:24,629][63771] DAMAGECOUNT value on done: 14204.0 +[2023-09-14 15:07:24,629][63771] Sum rewards: -6.756, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-2.674', 'AMMO2': '0.006', 'AMMO5': '0.020', 'AMMO4': '0.029', 'WEAPON1': '0.040', 'weapon5': '0.072', 'AMMO3': '0.185', 'HITCOUNT': '0.190', 'WEAPON4': '0.250', 'weapon4': '0.260', 'WEAPON5': '0.400', 'FRAGCOUNT': '0.500', 'ARMOR': '0.532', 'DAMAGECOUNT': '1.044', 'WEAPON3': '1.050', 'weapon2': '1.564', 'weapon3': '1.776'} +[2023-09-14 15:07:24,994][63771] DAMAGECOUNT value on done: 17464.0 +[2023-09-14 15:07:24,994][63771] Sum rewards: -4.421, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-1.302', 'AMMO5': '0.018', 'AMMO2': '0.023', 'WEAPON1': '0.040', 'weapon5': '0.042', 'weapon4': '0.064', 'ARMOR': '0.104', 'AMMO4': '0.117', 'AMMO3': '0.130', 'HITCOUNT': '0.140', 'WEAPON4': '0.200', 'WEAPON5': '0.200', 'DAMAGECOUNT': '0.465', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon3': '1.388', 'weapon2': '2.000'} +[2023-09-14 15:07:25,084][63734] DAMAGECOUNT value on done: 18131.0 +[2023-09-14 15:07:25,085][63734] Sum rewards: -0.200, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.500', 'AMMO4': '-0.004', 'AMMO2': '-0.001', 'ARMOR': '0.012', 'AMMO5': '0.024', 'weapon4': '0.024', 'WEAPON4': '0.050', 'WEAPON1': '0.060', 'AMMO3': '0.143', 'HITCOUNT': '0.250', 'WEAPON5': '0.400', 'weapon5': '0.522', 'WEAPON3': '0.800', 'DAMAGECOUNT': '1.083', 'weapon2': '1.448', 'FRAGCOUNT': '1.500', 'weapon3': '1.738'} +[2023-09-14 15:07:25,502][63734] DAMAGECOUNT value on done: 16118.0 +[2023-09-14 15:07:25,502][63734] Sum rewards: -3.107, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.340', 'AMMO2': '0.004', 'WEAPON1': '0.010', 'AMMO5': '0.020', 'AMMO4': '0.022', 'weapon5': '0.026', 'AMMO3': '0.138', 'HITCOUNT': '0.230', 'WEAPON5': '0.350', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.777', 'FRAGCOUNT': '1.000', 'weapon2': '1.220', 'weapon3': '1.936'} +[2023-09-14 15:07:25,960][63732] Updated weights for policy 0, policy_version 2420 (0.0011) +[2023-09-14 15:07:26,120][63769] DAMAGECOUNT value on done: 18652.0 +[2023-09-14 15:07:26,121][63769] Sum rewards: -1.849, reward structure: {'DEATHCOUNT': '-6.750', 'FRAGCOUNT': '-0.500', 'AMMO5': '0.005', 'WEAPON1': '0.020', 'AMMO2': '0.021', 'ARMOR': '0.033', 'weapon5': '0.068', 'AMMO3': '0.099', 'WEAPON5': '0.100', 'AMMO4': '0.104', 'HITCOUNT': '0.110', 'WEAPON4': '0.200', 'weapon4': '0.260', 'DAMAGECOUNT': '0.285', 'HEALTH': '0.446', 'WEAPON3': '0.550', 'weapon2': '1.252', 'weapon3': '1.848'} +[2023-09-14 15:07:26,432][63769] DAMAGECOUNT value on done: 13056.0 +[2023-09-14 15:07:26,432][63769] Sum rewards: 3.133, reward structure: {'DEATHCOUNT': '-4.500', 'HEALTH': '-1.430', 'AMMO5': '0.005', 'AMMO2': '0.010', 'WEAPON1': '0.020', 'AMMO4': '0.052', 'ARMOR': '0.064', 'AMMO3': '0.088', 'WEAPON4': '0.100', 'WEAPON5': '0.100', 'weapon5': '0.170', 'weapon4': '0.212', 'HITCOUNT': '0.290', 'WEAPON3': '0.650', 'weapon2': '1.198', 'DAMAGECOUNT': '1.320', 'weapon3': '1.784', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:07:26,438][63735] DAMAGECOUNT value on done: 15994.0 +[2023-09-14 15:07:26,439][63735] Sum rewards: 0.842, reward structure: {'DEATHCOUNT': '-6.000', 'HEALTH': '-0.059', 'weapon4': '0.004', 'AMMO5': '0.007', 'AMMO2': '0.038', 'WEAPON1': '0.040', 'AMMO3': '0.068', 'HITCOUNT': '0.090', 'WEAPON4': '0.100', 'WEAPON5': '0.150', 'AMMO4': '0.191', 'WEAPON3': '0.400', 'weapon5': '0.414', 'DAMAGECOUNT': '0.450', 'weapon3': '0.914', 'FRAGCOUNT': '2.000', 'weapon2': '2.034'} +[2023-09-14 15:07:26,885][63735] DAMAGECOUNT value on done: 13583.0 +[2023-09-14 15:07:26,886][63735] Sum rewards: 1.643, reward structure: {'DEATHCOUNT': '-6.750', 'AMMO5': '0.007', 'AMMO2': '0.021', 'WEAPON1': '0.030', 'HEALTH': '0.048', 'WEAPON4': '0.050', 'weapon5': '0.078', 'AMMO4': '0.105', 'AMMO3': '0.107', 'ARMOR': '0.128', 'HITCOUNT': '0.140', 'WEAPON5': '0.150', 'weapon4': '0.204', 'DAMAGECOUNT': '0.600', 'WEAPON3': '0.700', 'weapon2': '1.114', 'weapon3': '1.910', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:07:29,728][63806] DAMAGECOUNT value on done: 14719.0 +[2023-09-14 15:07:30,061][63733] Updated weights for policy 1, policy_version 2640 (0.0012) +[2023-09-14 15:07:30,144][63806] DAMAGECOUNT value on done: 16126.0 +[2023-09-14 15:07:30,144][63806] Sum rewards: -3.499, reward structure: {'DEATHCOUNT': '-10.500', 'HEALTH': '-2.052', 'AMMO2': '0.018', 'WEAPON1': '0.020', 'AMMO5': '0.026', 'weapon4': '0.078', 'AMMO4': '0.089', 'WEAPON4': '0.100', 'AMMO3': '0.239', 'HITCOUNT': '0.240', 'weapon5': '0.246', 'ARMOR': '0.400', 'WEAPON5': '0.450', 'WEAPON3': '0.900', 'DAMAGECOUNT': '0.900', 'weapon2': '1.468', 'weapon3': '1.880', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:07:31,199][63806] DAMAGECOUNT value on done: 15338.0 +[2023-09-14 15:07:31,200][63806] Sum rewards: -3.353, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-1.213', 'AMMO5': '0.015', 'AMMO2': '0.017', 'ARMOR': '0.032', 'weapon5': '0.036', 'WEAPON1': '0.050', 'AMMO4': '0.087', 'HITCOUNT': '0.090', 'weapon4': '0.094', 'WEAPON4': '0.100', 'AMMO3': '0.119', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.390', 'WEAPON3': '0.750', 'FRAGCOUNT': '1.000', 'weapon3': '1.478', 'weapon2': '1.552'} +[2023-09-14 15:07:31,562][63806] DAMAGECOUNT value on done: 15891.0 +[2023-09-14 15:07:31,562][63806] Sum rewards: -4.220, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.594', 'AMMO5': '0.005', 'AMMO2': '0.010', 'weapon5': '0.040', 'ARMOR': '0.048', 'AMMO4': '0.050', 'WEAPON1': '0.060', 'WEAPON5': '0.100', 'AMMO3': '0.109', 'HITCOUNT': '0.140', 'DAMAGECOUNT': '0.435', 'WEAPON3': '0.700', 'FRAGCOUNT': '1.000', 'weapon2': '1.622', 'weapon3': '1.804'} +[2023-09-14 15:07:32,586][63805] DAMAGECOUNT value on done: 16464.0 +[2023-09-14 15:07:32,991][63805] DAMAGECOUNT value on done: 18483.0 +[2023-09-14 15:07:33,981][63732] Updated weights for policy 0, policy_version 2430 (0.0012) +[2023-09-14 15:07:34,610][63805] DAMAGECOUNT value on done: 17163.0 +[2023-09-14 15:07:34,610][63805] Sum rewards: -6.579, reward structure: {'DEATHCOUNT': '-12.750', 'HEALTH': '-3.050', 'AMMO4': '-0.036', 'AMMO2': '-0.007', 'AMMO5': '0.031', 'WEAPON4': '0.050', 'weapon5': '0.060', 'weapon4': '0.200', 'AMMO3': '0.237', 'HITCOUNT': '0.250', 'ARMOR': '0.435', 'WEAPON5': '0.500', 'WEAPON3': '1.000', 'FRAGCOUNT': '1.500', 'DAMAGECOUNT': '1.530', 'weapon3': '1.718', 'weapon2': '1.754'} +[2023-09-14 15:07:35,066][63805] DAMAGECOUNT value on done: 14572.0 +[2023-09-14 15:07:35,066][63805] Sum rewards: -5.482, reward structure: {'DEATHCOUNT': '-11.250', 'HEALTH': '-1.746', 'ARMOR': '0.004', 'AMMO5': '0.015', 'AMMO2': '0.018', 'weapon5': '0.026', 'WEAPON1': '0.050', 'weapon4': '0.074', 'AMMO4': '0.089', 'WEAPON4': '0.100', 'AMMO3': '0.119', 'HITCOUNT': '0.150', 'WEAPON5': '0.300', 'DAMAGECOUNT': '0.405', 'WEAPON3': '0.850', 'weapon3': '1.520', 'weapon2': '1.794', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:07:35,936][63735] DAMAGECOUNT value on done: 14325.0 +[2023-09-14 15:07:35,937][63735] Sum rewards: -2.534, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.985', 'AMMO4': '-0.001', 'AMMO2': '-0.000', 'AMMO5': '0.017', 'WEAPON1': '0.020', 'weapon7': '0.090', 'WEAPON4': '0.100', 'AMMO6': '0.120', 'AMMO7': '0.120', 'weapon4': '0.122', 'AMMO3': '0.156', 'HITCOUNT': '0.180', 'WEAPON7': '0.200', 'weapon5': '0.214', 'WEAPON5': '0.350', 'ARMOR': '0.460', 'DAMAGECOUNT': '0.615', 'WEAPON3': '1.050', 'weapon2': '1.092', 'FRAGCOUNT': '1.500', 'weapon3': '2.046'} +[2023-09-14 15:07:36,274][63735] DAMAGECOUNT value on done: 18917.0 +[2023-09-14 15:07:36,275][63735] Sum rewards: -1.159, reward structure: {'DEATHCOUNT': '-8.250', 'AMMO2': '0.008', 'AMMO5': '0.010', 'ARMOR': '0.028', 'WEAPON1': '0.030', 'AMMO4': '0.039', 'WEAPON4': '0.050', 'weapon5': '0.096', 'AMMO3': '0.119', 'WEAPON5': '0.200', 'HITCOUNT': '0.240', 'HEALTH': '0.462', 'WEAPON3': '0.500', 'DAMAGECOUNT': '0.945', 'FRAGCOUNT': '1.000', 'weapon2': '1.612', 'weapon3': '1.752'} +[2023-09-14 15:07:37,191][63733] Updated weights for policy 1, policy_version 2650 (0.0011) +[2023-09-14 15:07:37,801][63767] DAMAGECOUNT value on done: 18286.0 +[2023-09-14 15:07:37,802][63767] Sum rewards: -3.925, reward structure: {'DEATHCOUNT': '-9.000', 'HEALTH': '-1.669', 'AMMO4': '-0.053', 'AMMO2': '-0.010', 'AMMO5': '0.007', 'weapon5': '0.014', 'WEAPON1': '0.020', 'ARMOR': '0.036', 'WEAPON5': '0.150', 'AMMO3': '0.184', 'HITCOUNT': '0.230', 'DAMAGECOUNT': '0.696', 'WEAPON3': '0.950', 'FRAGCOUNT': '1.000', 'weapon2': '1.246', 'weapon3': '2.274'} +[2023-09-14 15:07:38,260][63767] DAMAGECOUNT value on done: 17581.0 +[2023-09-14 15:07:38,260][63767] Sum rewards: -0.654, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-0.852', 'AMMO4': '-0.005', 'AMMO2': '-0.001', 'AMMO5': '0.005', 'WEAPON1': '0.030', 'weapon5': '0.032', 'ARMOR': '0.083', 'AMMO3': '0.084', 'WEAPON5': '0.100', 'WEAPON4': '0.100', 'HITCOUNT': '0.170', 'weapon4': '0.170', 'DAMAGECOUNT': '0.495', 'WEAPON3': '0.600', 'weapon2': '1.274', 'weapon3': '1.810', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:07:40,390][63734] DAMAGECOUNT value on done: 15466.0 +[2023-09-14 15:07:40,391][63734] Sum rewards: -4.446, reward structure: {'DEATHCOUNT': '-12.000', 'HEALTH': '-1.578', 'weapon5': '0.008', 'AMMO5': '0.010', 'weapon4': '0.012', 'AMMO2': '0.028', 'WEAPON1': '0.040', 'ARMOR': '0.044', 'AMMO4': '0.140', 'AMMO3': '0.176', 'WEAPON5': '0.200', 'HITCOUNT': '0.200', 'WEAPON4': '0.250', 'DAMAGECOUNT': '0.612', 'WEAPON3': '1.000', 'weapon2': '1.508', 'weapon3': '1.904', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:07:40,849][63734] DAMAGECOUNT value on done: 15926.0 +[2023-09-14 15:07:40,849][63734] Sum rewards: 1.286, reward structure: {'DEATHCOUNT': '-7.500', 'HEALTH': '-1.128', 'AMMO2': '0.007', 'AMMO5': '0.013', 'weapon5': '0.014', 'AMMO4': '0.036', 'weapon7': '0.050', 'AMMO3': '0.129', 'AMMO6': '0.200', 'WEAPON7': '0.200', 'AMMO7': '0.200', 'WEAPON5': '0.250', 'WEAPON4': '0.350', 'HITCOUNT': '0.370', 'ARMOR': '0.488', 'weapon4': '0.514', 'WEAPON3': '0.850', 'DAMAGECOUNT': '1.197', 'weapon3': '1.464', 'weapon2': '1.582', 'FRAGCOUNT': '2.000'} +[2023-09-14 15:07:42,175][63732] Updated weights for policy 0, policy_version 2440 (0.0011) +[2023-09-14 15:07:42,286][63769] DAMAGECOUNT value on done: 16207.0 +[2023-09-14 15:07:42,286][63769] Sum rewards: -2.318, reward structure: {'DEATHCOUNT': '-9.750', 'HEALTH': '-0.885', 'WEAPON1': '0.020', 'ARMOR': '0.020', 'weapon4': '0.024', 'AMMO2': '0.024', 'AMMO5': '0.026', 'weapon7': '0.082', 'WEAPON4': '0.100', 'AMMO4': '0.120', 'AMMO3': '0.171', 'weapon5': '0.190', 'HITCOUNT': '0.240', 'AMMO6': '0.260', 'AMMO7': '0.260', 'WEAPON7': '0.300', 'WEAPON5': '0.500', 'WEAPON3': '0.750', 'DAMAGECOUNT': '0.807', 'FRAGCOUNT': '1.000', 'weapon2': '1.196', 'weapon3': '2.228'} +[2023-09-14 15:07:42,627][63769] DAMAGECOUNT value on done: 14653.0 +[2023-09-14 15:07:42,628][63769] Sum rewards: 3.675, reward structure: {'DEATHCOUNT': '-6.750', 'HEALTH': '-1.690', 'AMMO5': '0.010', 'AMMO2': '0.023', 'WEAPON1': '0.050', 'weapon4': '0.054', 'WEAPON4': '0.100', 'AMMO4': '0.115', 'AMMO3': '0.120', 'weapon5': '0.148', 'HITCOUNT': '0.300', 'WEAPON5': '0.300', 'ARMOR': '0.506', 'WEAPON3': '0.800', 'weapon2': '1.436', 'DAMAGECOUNT': '1.449', 'weapon3': '1.704', 'FRAGCOUNT': '5.000'} +[2023-09-14 15:07:43,112][63771] DAMAGECOUNT value on done: 16043.0 +[2023-09-14 15:07:43,470][63771] DAMAGECOUNT value on done: 12806.0 +[2023-09-14 15:07:43,470][63771] Sum rewards: 0.012, reward structure: {'DEATHCOUNT': '-8.250', 'HEALTH': '-0.910', 'AMMO2': '0.005', 'WEAPON1': '0.020', 'AMMO5': '0.023', 'AMMO4': '0.026', 'ARMOR': '0.052', 'weapon7': '0.052', 'weapon5': '0.098', 'AMMO6': '0.120', 'AMMO7': '0.120', 'AMMO3': '0.138', 'HITCOUNT': '0.190', 'WEAPON7': '0.200', 'WEAPON5': '0.350', 'DAMAGECOUNT': '0.660', 'WEAPON3': '0.850', 'weapon2': '1.194', 'weapon3': '2.074', 'FRAGCOUNT': '3.000'} +[2023-09-14 15:07:44,232][63733] Updated weights for policy 1, policy_version 2660 (0.0012) +[2023-09-14 15:07:44,233][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000002660_10895360.pth... +[2023-09-14 15:07:44,233][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002442_10002432.pth... +[2023-09-14 15:07:44,239][63454] Stopping Batcher_0... +[2023-09-14 15:07:44,254][63732] Weights refcount: 2 0 +[2023-09-14 15:07:44,255][63732] Stopping InferenceWorker_p0-w0... +[2023-09-14 15:07:44,256][63732] Loop inference_proc0-0_evt_loop terminating... +[2023-09-14 15:07:44,256][63733] Weights refcount: 2 0 +[2023-09-14 15:07:44,257][63733] Stopping InferenceWorker_p1-w0... +[2023-09-14 15:07:44,258][63733] Loop inference_proc1-0_evt_loop terminating... +[2023-09-14 15:07:44,246][63576] Stopping Batcher_1... +[2023-09-14 15:07:44,260][63454] Loop batcher_evt_loop terminating... +[2023-09-14 15:07:44,270][63576] Loop batcher_evt_loop terminating... +[2023-09-14 15:07:44,294][63454] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002201_9015296.pth +[2023-09-14 15:07:44,302][63454] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p0/checkpoint_000002442_10002432.pth... +[2023-09-14 15:07:44,302][63576] Removing /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000002376_9732096.pth +[2023-09-14 15:07:44,311][63576] Saving /home/cogstack/Documents/optuna/environments/sample_factory/train_dir/default_experiment/checkpoint_p1/checkpoint_000002660_10895360.pth... +[2023-09-14 15:07:44,313][63771] Stopping RolloutWorker_w5... +[2023-09-14 15:07:44,313][63771] Loop rollout_proc5_evt_loop terminating... +[2023-09-14 15:07:44,316][63805] Stopping RolloutWorker_w6... +[2023-09-14 15:07:44,316][63805] Loop rollout_proc6_evt_loop terminating... +[2023-09-14 15:07:44,316][63770] Stopping RolloutWorker_w4... +[2023-09-14 15:07:44,317][63769] Stopping RolloutWorker_w3... +[2023-09-14 15:07:44,317][63770] Loop rollout_proc4_evt_loop terminating... +[2023-09-14 15:07:44,317][63769] Loop rollout_proc3_evt_loop terminating... +[2023-09-14 15:07:44,318][63734] Stopping RolloutWorker_w1... +[2023-09-14 15:07:44,319][63735] Stopping RolloutWorker_w0... +[2023-09-14 15:07:44,320][63734] Loop rollout_proc1_evt_loop terminating... +[2023-09-14 15:07:44,321][63767] Stopping RolloutWorker_w2... +[2023-09-14 15:07:44,321][63806] Stopping RolloutWorker_w7... +[2023-09-14 15:07:44,323][63735] Loop rollout_proc0_evt_loop terminating... +[2023-09-14 15:07:44,323][63806] Loop rollout_proc7_evt_loop terminating... +[2023-09-14 15:07:44,323][63767] Loop rollout_proc2_evt_loop terminating... +[2023-09-14 15:07:44,392][63454] Stopping LearnerWorker_p0... +[2023-09-14 15:07:44,392][63454] Loop learner_proc0_evt_loop terminating... +[2023-09-14 15:07:44,403][63576] Stopping LearnerWorker_p1... +[2023-09-14 15:07:44,403][63576] Loop learner_proc1_evt_loop terminating... diff --git a/environments/sample_factory/wandb/latest-run b/environments/sample_factory/wandb/latest-run index 569faa1..49308ae 120000 --- a/environments/sample_factory/wandb/latest-run +++ b/environments/sample_factory/wandb/latest-run @@ -1 +1 @@ -run-20230912_182125-default_experiment_20230912_165919_228624 \ No newline at end of file +run-20230914_143511-qiyz0kuy \ No newline at end of file diff --git a/environments/unity/ml-agents b/environments/unity/ml-agents --- a/environments/unity/ml-agents +++ b/environments/unity/ml-agents @@ -1 +1 @@ -Subproject commit 8bcedabd808ffb7097f88b800fc92dea82dfd610 +Subproject commit 8bcedabd808ffb7097f88b800fc92dea82dfd610-dirty